Spaces:

TTsamurai
/

FinPersona_ECIR

Sleeping

App Files Files Community

TTsamurai committed on Mar 24

Commit

edf52d9

0 Parent(s):

first commit

Browse files

Files changed (49) hide show

.DS_Store +0 -0
.gitattributes +35 -0
.gitignore +164 -0
.python-version +1 -0
README.md +13 -0
_static/html/evaluation_instruction.html +21 -0
_static/html/final_evaluation.html +36 -0
_static/html/general_instruction.html +27 -0
_static/html/instruction_page.html +55 -0
_static/html/system_instruction_preference_elicitation.html +21 -0
_static/html/user_narrative.html +8 -0
_static/txt/general_instruction_button.txt +1 -0
_static/txt/general_instruction_task.txt +1 -0
_static/txt/personality_ext.txt +1 -0
_static/txt/personality_int.txt +1 -0
_static/txt/system_instruction_non_personalization.txt +1 -0
_static/txt/system_instruction_personality.txt +1 -0
_static/txt/system_instruction_personalization.txt +1 -0
_static/txt/system_instruction_preference_elicitation.txt +5 -0
_static/txt/system_instruction_preference_elicitation_personality.txt +5 -0
_static/txt/system_summarization_user_preference_elicitation.txt +1 -0
app.py +1392 -0
components/chat_conversation.py +173 -0
components/constant.py +19 -0
components/induce_personality.py +34 -0
components/prompt.py +10 -0
components/query_rewriting.py +60 -0
components/rag_components.py +190 -0
components/rewrite_passages.py +94 -0
data/single_stock_data/experiment_processed_data.jsonl +3 -0
data/single_stock_data/single_stock_demo.jsonl +0 -0
dum.txt +352 -0
experiments/experiment_with_api_without_personalization.py +665 -0
experiments/personality_simulation.py +60 -0
experiments/separate_preference_elicitation_and_interaction.py +851 -0
experiments/single_stock_experiment.py +574 -0
requirements.txt +3 -0
user_feedback/interaction_3a48b93b-0de7-4e2a-b779-8f1f0c27af24_first.json +2 -0
user_feedback/interaction_462c2c52-b14f-44f1-8030-6f06d5a7d925_first.json +2 -0
user_feedback/interaction_7017b92d-6932-4d3a-b189-1267c2386995_first.json +2 -0
user_feedback/interaction_7e25ac2e-3849-4817-9ae3-e883bca2fb10_first.json +4 -0
user_feedback/interaction_8611c342-840f-4529-b9ff-d1dabb754ded_first.json +6 -0
user_feedback/interaction_8e1566fb-6de9-46da-a3de-c6a580fb5b83_first.json +2 -0
user_feedback/interaction_abfb0425-8dff-4b63-91d0-372276758a8f_first.json +4 -0
user_feedback/interaction_b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea_first.json +16 -0
user_feedback/interaction_d34ca619-e30a-4267-9538-cc8f99aff079.json +4 -0
user_feedback/interaction_e7f30c05-4668-4b35-a706-ba27b7c0a0a9_first.json +2 -0
user_feedback/summarization_8611c342-840f-4529-b9ff-d1dabb754ded_first.json +1 -0
user_feedback/summarization_d34ca619-e30a-4267-9538-cc8f99aff079.json +1 -0

.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

.gitattributes ADDED Viewed

	@@ -0,0 +1,35 @@

+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text

.gitignore ADDED Viewed

	@@ -0,0 +1,164 @@

+log/
+old_user_feedback/
+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+# C extensions
+*.so
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+share/python-wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+# PyInstaller
+#  Usually these files are written by a python script from a template
+#  before PyInstaller builds the exe, so as to inject date/other infos into it.
+*.manifest
+*.spec
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.nox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+*.py,cover
+.hypothesis/
+.pytest_cache/
+cover/
+# Translations
+*.mo
+*.pot
+# Django stuff:
+*.log
+local_settings.py
+db.sqlite3
+db.sqlite3-journal
+# Flask stuff:
+instance/
+.webassets-cache
+# Scrapy stuff:
+.scrapy
+# Sphinx documentation
+docs/_build/
+# PyBuilder
+.pybuilder/
+target/
+# Jupyter Notebook
+.ipynb_checkpoints
+# IPython
+profile_default/
+ipython_config.py
+# pyenv
+#   For a library or package, you might want to ignore these files since the code is
+#   intended to run in multiple environments; otherwise, check them in:
+# .python-version
+# pipenv
+#   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
+#   However, in case of collaboration, if having platform-specific dependencies or dependencies
+#   having no cross-platform support, pipenv may install dependencies that don't work, or not
+#   install all needed dependencies.
+#Pipfile.lock
+# poetry
+#   Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
+#   This is especially recommended for binary packages to ensure reproducibility, and is more
+#   commonly ignored for libraries.
+#   https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
+#poetry.lock
+# pdm
+#   Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
+#pdm.lock
+#   pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
+#   in version control.
+#   https://pdm.fming.dev/latest/usage/project/#working-with-version-control
+.pdm.toml
+.pdm-python
+.pdm-build/
+# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
+__pypackages__/
+# Celery stuff
+celerybeat-schedule
+celerybeat.pid
+# SageMath parsed files
+*.sage.py
+# Environments
+.env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+# Spyder project settings
+.spyderproject
+.spyproject
+# Rope project settings
+.ropeproject
+# mkdocs documentation
+/site
+# mypy
+.mypy_cache/
+.dmypy.json
+dmypy.json
+# Pyre type checker
+.pyre/
+# pytype static type analyzer
+.pytype/
+# Cython debug symbols
+cython_debug/
+# PyCharm
+#  JetBrains specific template is maintained in a separate JetBrains.gitignore that can
+#  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
+#  and can be added to the global gitignore or merged into this file.  For a more nuclear
+#  option (not recommended) you can uncomment the following to ignore the entire idea folder.
+#.idea/

.python-version ADDED Viewed

	@@ -0,0 +1 @@


1	+ 3.9.7

README.md ADDED Viewed

	@@ -0,0 +1,13 @@

+---
+title: UserStudyFinancialAdvisor
+emoji: 💻
+colorFrom: pink
+colorTo: pink
+sdk: gradio
+sdk_version: 4.44.1
+app_file: app.py
+pinned: false
+license: mit
+---
+Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

_static/html/evaluation_instruction.html ADDED Viewed

	@@ -0,0 +1,21 @@

+<div style="background-color: #f9f9f9; padding: 20px; border-radius: 10px; box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1); margin-bottom: 20px; max-height: 780px; overflow-y: auto; overflow-x: hidden;">
+    <h2 style="color: #2c3e50; text-align: center;">Evaluation Instructions</h2>
+    <p style="font-size: 16px; color: #34495e; line-height: 1.6;">
+      Welcome to the evaluation process! Please follow the steps below to complete your evaluation:
+    </p>
+    <ol style="font-size: 16px; color: #34495e; line-height: 1.8;">
+      <!-- <li><strong>Decision Making:</strong>Please respond with either <strong>Yes</strong> or <strong>No</strong> to the question: "Would you like to purchase the stock?"</li> -->
+      <!-- <li><strong>Reason:</strong> Write down the reason for your choice in the free text box labeled "The reason of your choice".</li> -->
+      <!-- <li><strong>A simple recall question:</strong>Which company were you discussing?</li> -->
+      <li><strong>Evaluation Criteria:</strong> Please evaluate the system in the following aspects:
+        <ul>
+          <li><strong>Likelihood of Purchase:</strong> Rate the likelihood of purchase.</li>
+          <li><strong>Reason:</strong> Write down the reason for your choice in the free text box labeled "The reason of your choice".</li>
+          <li><strong>Confidence in Your Decision:</strong> Rate the confidence in your decision.</li>
+          <li><strong>Familiarity Level:</strong> Rate your familiarity with the stock before the interaction.</li>
+        </ul>
+      </li>
+      <li>After completing all the evaluation criteria, <strong>click the "Send: Evaluation" button</strong> to submit your responses. <strong>Once you submit, you cannot resubmit, so please review your answers carefully before submitting.</strong></li>
+    </ol>
+  </div>

_static/html/final_evaluation.html ADDED Viewed

	@@ -0,0 +1,36 @@

+<div style="background-color: #f9f9f9; padding: 20px; border-radius: 10px; box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1); margin-bottom: 20px; max-height: 780px; overflow-y: auto; overflow-x: hidden;">
+    <!-- Heading -->
+    <h2 style="color: #2c3e50; text-align: center; margin-bottom: 20px; font-size: 20px; font-weight: 600;">
+        Instruction: Final Evaluation
+    </h2>
+    <!-- User Instruction -->
+    <p style="text-align: left; font-size: 16px; color: #34495e; margin-bottom: 20px;">
+        In the final evaluation, you will first rank the individual stocks below based on your discussion with your financial advisor, according to your desire to invest in each one. Use the following guidelines to assign a unique rank to each stock:
+    </p>
+    <!-- Ranking Instructions List -->
+    <ul style="font-size: 16px; color: #34495e; margin-left: 20px; margin-bottom: 20px;">
+        <li><strong>Rank 1:</strong> The stock you are most eager to invest in.</li>
+        <li><strong>Rank 2:</strong> The second most preferred stock for investment.</li>
+        <!-- <li><strong>Rank 3:</strong> A stock you are moderately interested in investing in.</li> -->
+        <li><strong>Rank 3:</strong> The second least preferred stock for investment.</li>
+        <li><strong>Rank 4:</strong> The stock you are least likely to invest in.</li>
+        <!-- <li><strong>Rank 5:</strong> The stock you are least likely to invest in.</li> -->
+    </ul>
+    <!-- Important Note -->
+    <p style="text-align: left; font-size: 16px; color: #e74c3c; margin-bottom: 20px;">
+        <strong>Important:</strong> Each stock must receive a different rank (from 1 to 4), and no two stocks can share the same rank.
+    </p>
+    <p style="text-align: left; font-size: 16px; color: #34495e; margin-bottom: 20px;">
+        Then, evaluate the advisor by choosing a number between <strong style="color:red;">1 (Strongly Disagree)</strong> and <strong style="color:green;">7 (Strongly Agree)</strong> for each statement.
+    </p>
+    <!-- Final Instruction -->
+    <p style="text-align: left; font-size: 16px; color: #34495e;">
+        After assigning a rank to each stock and evaluating the advisor, click the <strong>"Submit Ranking"</strong> button to submit your evaluation.
+    </p>
+</div>

_static/html/general_instruction.html ADDED Viewed

	@@ -0,0 +1,27 @@

+<!-- Grouped Container for Task Instruction and Stock Information -->
+<div style="background-color: #f9f9f9; padding: 20px; border-radius: 10px; box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1); margin-bottom: 20px; max-height: 780px; overflow-y: auto; overflow-x: hidden;">
+    <!-- Heading -->
+    <h2 style="color: #2c3e50; text-align: center; margin-bottom: 20px; font-size: 20px; font-weight: 600;">
+        Instruction: Financial Decision Stage
+    </h2>
+    <!-- User Instruction -->
+    <p style="text-align: left; font-size: 16px; color: #34495e; margin-bottom: 20px;">
+        <div>
+            <p>It is December 31, 2023. You are an investor interested in purchasing individual stocks. You understand and accept the risks involved, and you’ve come to consult a financial advisor for guidance on which individual stocks might suit your needs.</p>
+            <p>In this experiment, you will be presented with one stock per round over four rounds (a total of four stocks). For each stock, engage with the financial advisor to determine whether the stock is suitable for your needs or not. If you come across unfamiliar financial concepts or don’t fully understand what the financial advisor says, <strong>feel free to ask questions for clarification</strong>.</p>
+            Once <strong>you feel that you have gathered enough information to make a financial decision, you can move on to the evaluation phase</strong>.
+            Remember, the candidate stock has been <strong>randomly</strong> selected for this exploration and is <strong>not a recommendation</strong> from the financial advisor.
+            <!-- <p>If you don’t have a strong preference about certain characteristics of the stock, <span style="background-color: yellow;">you may simply state, “I don’t have a preference on this dimension.”</span></p> -->
+            <p>To interact with the financial advisor, first push the <strong>Start Conversation</strong> button. Then, type your message in the <strong>User Input</strong> textbox and press the <strong>Send This Message to Advisor</strong> button. If the response from the financial advisor is cut off due to word limitations, press the <strong>Show More of the Advisor’s Answer</strong> button to have the advisor continue the conversation. If you already have enough information to make a decision, you don’t need to press the <strong>Show More of the Advisor’s Answer</strong> button.</p>
+            <p>You will go through four rounds of financial decisions. Each round consists of a “Discussion (Discuss)” and an “Evaluation (Eval)” phase. Please move through the following sequence: 1-1: Discuss → 1-2: Eval → 2-1: Discuss → 2-2: Eval → … → 4-2: Eval.</p>
+        </div>
+    </p>
+</div>

_static/html/instruction_page.html ADDED Viewed

	@@ -0,0 +1,55 @@

+<div style="font-family: Arial, sans-serif; line-height: 1.6; max-width: 800px; margin: auto; padding: 20px; background-color: #f9f9f9; border-radius: 10px;"></div>
+    <h2 style="color: #2c3e50; text-align: center;">Welcome to the Financial Advisory Experiment</h2>
+    <p style=" color: #34495e; text-align: center;">Please read the instructions carefully before beginning.</p>
+    <p style=" color: #34495e;">
+        In this experiment, you will role-play as a user profile and decide whether to purchase a stock by interacting with a financial advisor over four candidate stocks.
+    </p>
+    <div style="background-color: #eaf7f7; padding: 15px; border-left: 5px solid #17a2b8; margin-bottom: 20px;">
+        <strong>Step 1: Preference Elicitation Stage</strong>
+        <p>
+            During this stage, financial advisors will ask you a series of questions to gather insights into your investment preferences and needs. The information you provide will be used to guide the discussions and decisions in the subsequent stages. You will be assigned a user narrative that describes an investor interested in buying individual stocks but unsure of which to choose. <strong>Review the narrative thoroughly and role-play as the investor described.</strong>
+        </p>
+    </div>
+    <div style="background-color: #f2f5ff; padding: 15px; border-left: 5px solid #6c63ff; margin-bottom: 20px;">
+        <strong>Step 2: Financial Decision Stage</strong>
+        <p>
+            You will go through four rounds of financial decisions. Each round consists of a “Discussion (Discuss)” and an “Evaluation (Eval)” phase. Please move through the following sequence: 1-1: Discuss → 1-2: Eval → 2-1: Discuss → 2-2: Eval → … → 4-2: Eval.
+        </p>
+        <div style="margin-left: 20px;">
+            <h4 style="color: #6c63ff;">Discussion Phase (e.g., 1-1: Discuss)</h4>
+            <p style="color: #34495e;">
+                You will receive general instructions and information about the candidate stock, which has been <strong>randomly selected for this exploration</strong>. After understanding the instructions, engage with the financial advisor to make financial decisions. <strong>Once you feel that you have gathered enough information to make a financial decision, you can move on to the evaluation phase.</strong>
+                Please note, the candidate stock is <strong>not a recommendation</strong> from the financial advisor.
+            </p>
+            <h4 style="color: #6c63ff;">Evaluation Phase (e.g., 1-2: Eval)</h4>
+            <p style=" color: #34495e;">
+                Once you feel informed, switch to the Evaluation tab and complete your evaluation for the stock.
+            </p>
+            <h4 style="color: #6c63ff;">Next Round (e.g., 2-1: Discuss)</h4>
+            <p style=" color: #34495e;">
+                After completing the evaluation for one stock, move to the next stock tab and repeat the process. Continue until all four stocks have been evaluated.
+            </p>
+        </div>
+    </div>
+    <div style="background-color: #fff8e1; padding: 15px; border-left: 5px solid #ffc107; margin-bottom: 20px;">
+        <strong>Step 3: Final Evaluation</strong>
+        <p style="color: #34495e;">
+            Based on your conversations with your financial advisor, you will first rank the individual stocks according to your desire to invest in each one, then evaluate the advisor by answering the questions.
+            <strong>Assign a unique rank to each stock</strong> (1 being the most preferred, 4 being the least preferred), and <strong>answer all the questions</strong> (1 being strongly disagree, 7 being strongly agree).
+        </p>
+    </div>
+    <!-- Cautionary Guidelines -->
+    <div style="background-color: #fdecea; padding: 15px; border-left: 5px solid #e74c3c; margin-top: 20px;">
+        <h4 style="color: #e74c3c;">Cautionary Guidelines</h4>
+        <ul style="color: #34495e;">
+            <li>Do not <strong>refresh</strong> or <strong>reload</strong> the page. Doing so will result in <strong>loss of data</strong>, and you will have to <strong>restart the experiment</strong> from the beginning.</li>
+            <li>Please move through the following sequence: <strong>Experiment Instruction</strong> → <strong>Preference Elicitation Stage</strong> → <strong>Financial Decision Stage</strong> → <strong>Final Evaluation</strong>.</li>
+        </ul>
+    </div>

_static/html/system_instruction_preference_elicitation.html ADDED Viewed

	@@ -0,0 +1,21 @@

+<div style="background-color: #f9f9f9; padding: 20px; border-radius: 10px; box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1); margin-bottom: 20px; max-height: 780px; overflow-y: auto; overflow-x: hidden;">
+    <!-- Heading -->
+    <h2 style="color: #2c3e50; text-align: center; margin-bottom: 20px; font-size: 20px; font-weight: 600;">
+        Instruction: Preference Elicitation Stage
+    </h2>
+    <!-- User Instruction -->
+    <!-- <p style="text-align: left; font-size: 16px; color: #34495e; margin-bottom: 20px;">
+        It is December 31, 2023. You are an investor interested in purchasing individual stocks. You understand and accept the associated risks, and you’ve come to consult a financial advisor for guidance on which stocks may suit your needs.
+        In this stage, the financial advisor will ask you several questions to better understand your investment goals and preferences. When answering, it is not necessary to have a preference for every aspect of investing. If you do not have a preference regarding a particular dimension, you may simply state, “I don’t have a preference on this dimension.” Additionally, if there is anything you do not understand in what the advisor says, feel free to ask questions for clarification. This will help you gain a deeper understanding of the advice provided.
+        To interact with the financial advisor, first push the start conversation button. Then, type your message in the User Input textbox and press the Send This Message to Advisor button. If the response from the financial advisor is cut off due to word limitations, press the Show More of the Advisor’s Answer button to have the advisor continue the conversation. If you already have enough information to make a decision, you don’t need to press the Show More of the Advisor’s Answer button.
+    </p> -->
+    <p style="text-align: left; font-size: 16px; color: #34495e; margin-bottom: 20px; line-height: 1.6;">
+        It is December 31, 2023. You are an investor interested in purchasing individual stocks. You understand and accept the associated risks, and you’ve come to consult a financial advisor for guidance on which stocks may suit your needs.
+        <br><br>
+        This stage aims to explore and deepen the understanding of your investment preferences. Your financial advisor will ask several questions to better understand your investment goals and preferences. You don’t need to have a preference for every aspect of investing. <strong>If you’re asked about a topic where you have no preference, simply say, “I don’t have a preference on this topic.”</strong> Note that this stage focuses on your investment preferences. Specific details about individual stocks should be discussed during the financial decision stage.
+        <strong> Feel free to ask questions for clarification</strong> if there is anything you do not understand in what the advisor says. This will help you gain a deeper understanding of the advice provided.
+        <br><br>
+        To interact with the financial advisor, first push the <strong>Start Conversation</strong> button. Then, type your message in the <strong>User Input</strong> textbox and press the <strong>Send This Message to Advisor</strong> button. If the response from the financial advisor is cut off due to word limitations, press the <strong>Show More of the Advisor’s Answer</strong> button to have the advisor continue the conversation. If you already have enough information to make a decision, you don’t need to press the <strong>Show More of the Advisor’s Answer</strong> button.
+    </p>
+</div>

_static/html/user_narrative.html ADDED Viewed

	@@ -0,0 +1,8 @@

+<!-- User Narrative (Bold label, Normal narrative) -->
+<div style="text-align: left; font-size: 20px; font-weight: bold; margin-bottom: 20px;">
+    User Narrative
+</div>
+<div style="text-align: left; font-weight: normal; font-size: 16px; margin-bottom: 20px;">
+    {user_narrative}
+</div>
+</div>

_static/txt/general_instruction_button.txt ADDED Viewed

	@@ -0,0 +1 @@

+ To interact with the financial advisor, first push the start conversation button. Then, type your message in the Input: User Input textbox and press the Send: User Input button. If the response from the financial advisor is cut off due to word limitations, press the “Continue” button to have the advisor continue the conversation. If you already have enough information to make a decision, you don’t need to press the “Continue” button.

_static/txt/general_instruction_task.txt ADDED Viewed

	@@ -0,0 +1 @@

+ It is December 31, 2023. You are an investor interested in purchasing individual stocks. You understand and accept the risks involved, and you’ve come to consult a financial advisor for guidance on which individual stocks might suit your needs. In this experiment, you will be presented with one stock per round over five rounds (a total of five stocks). For each stock, engage with the financial advisor to determine whether the stock is suitable for your needs or not. If you come across unfamiliar financial concepts or don’t fully understand what the financial advisor says, be sure to ask for definitions or explanations.

_static/txt/personality_ext.txt ADDED Viewed

	@@ -0,0 +1 @@


1	+ You are extroverted (affectionate, friendly, fun-loving, confident), agreeable (cheerful, trusting, amiable, humble, polite, helpful), low in conscientiousness (reliable, consistent, perceptive), open to experience (insightful, original, clever, daring), and emotionally stable.

_static/txt/personality_int.txt ADDED Viewed

	@@ -0,0 +1 @@


1	+ You are introverted (reserved, quiet, insecure), antagonistic (skeptical, blunt, independent), conscientious (organized, disciplined, responsible), closed to experience (practical, thoughtful, cautious), and neurotic (anxious, nervous).

_static/txt/system_instruction_non_personalization.txt ADDED Viewed

	@@ -0,0 +1 @@

+ You are a professional financial advisor speaking with a customer who is interested in purchasing individual stocks. In this session, you are faced with a candidate stock and work together to understand if it aligns with the customer. Remember, the stock was selected randomly, and you are not recommending this specific stock, nor do you know whether the customer has any particular interest in it. Your task is to interact with the customer, using the stock’s details to help them determine whether the stock is a good fit for them. Do not attempt to collect any users’ information, such as risk tolerance or preferred industries. Instead, assist the user in a non-personalized way. First, start the conversation by providing a brief description of the company, and then ask the customer what they would like to know more about. When asking questions to the customer, incorporate both open-ended and closed-ended questions when relevant, rather than sticking to only closed-ended questions. In this session, keep the conversation centered on the current candidate stock. Avoid discussing other stocks unless you are making a direct comparison to the candidate stock. If users attempt to shift the focus to other stocks, remind them to stay on topic or suggest moving to the next round. The main focus should always be the candidate stock. If the customer is unfamiliar with any financial concepts, explain them to help the customer make an informed decision. If you do not have the information the client has requested, please be honest and inform them that the data is not available. Keep responses concise, AT MOST ONE HUNDRED WORDS. If additional information is necessary, a longer response is acceptable, but aim to be brief and to the point.

_static/txt/system_instruction_personality.txt ADDED Viewed

	@@ -0,0 +1 @@

+ You are a professional financial advisor speaking with a customer who is interested in purchasing individual stocks. {personality} Emphasize the personality in the conversation. Do not include any expressions in parentheses such as pauses, hesitations, or physical actions. The dialogue should focus purely on the verbal content of the conversation. In this session, you are faced with a candidate stock and work together to understand if it aligns with the customer. It’s important to tailor the information based on the user’s profile to ensure the conversation is personalized. Remember, the stock was selected randomly, and you are not recommending this specific stock, nor do you know whether the customer has any particular interest in it. User profile is provided below under “Previous Conversations with the Customer about the User Profile.” Your task is to interact with the customer, using the stock’s details and the user profile to help them determine whether the stock is a good fit for them in a personalized manner. First, start the conversation by providing a brief description of the company in a personalized manner, highlighting both the ways in which the company fits the user’s profile and any potential misalignments, and then ask the customer what they would like to know more about. When asking questions to the customer, incorporate both open-ended and closed-ended questions when relevant, rather than sticking to only closed-ended questions. In this session, keep the conversation centered on the current candidate stock. Avoid discussing other stocks unless you are making a direct comparison to the candidate stock. If users attempt to shift the focus to other stocks, remind them to stay on topic or suggest moving to the next round. The main focus should always be the candidate stock. If the customer is unfamiliar with any financial concepts, explain them to help the customer make an informed decision. 
If you do not have the information the client has requested, please be honest and inform them that the data is not available. Keep responses concise, AT MOST ONE HUNDRED WORDS. If additional information is necessary, a longer response is acceptable, but aim to be brief and to the point.

_static/txt/system_instruction_personalization.txt ADDED Viewed

	@@ -0,0 +1 @@

+ You are a professional financial advisor speaking with a customer who is interested in purchasing individual stocks. In this session, you are faced with a candidate stock and work together to understand if it aligns with the customer. It’s important to tailor the information based on the user’s profile to ensure the conversation is personalized. Remember, the stock was selected randomly, and you are not recommending this specific stock, nor do you know whether the customer has any particular interest in it. User profile is provided below under “Previous Conversations with the Customer about the User Profile.” Your task is to interact with the customer, using the stock’s details and the user profile to help them determine whether the stock is a good fit for them in a personalized manner. First, start the conversation by providing a brief description of the company in a personalized manner, highlighting both the ways in which the company fits the user’s profile and any potential misalignments, and then ask the customer what they would like to know more about. When asking questions to the customer, incorporate both open-ended and closed-ended questions when relevant, rather than sticking to only closed-ended questions. In this session, keep the conversation centered on the current candidate stock. Avoid discussing other stocks unless you are making a direct comparison to the candidate stock. If users attempt to shift the focus to other stocks, remind them to stay on topic or suggest moving to the next round. The main focus should always be the candidate stock. If the customer is unfamiliar with any financial concepts, explain them to help the customer make an informed decision. If you do not have the information the client has requested, please be honest and inform them that the data is not available. Keep responses concise, AT MOST ONE HUNDRED WORDS. If additional information is necessary, a longer response is acceptable, but aim to be brief and to the point.

_static/txt/system_instruction_preference_elicitation.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+You are a financial advisor discussing individual stocks with a customer. Your goal is to understand their investment preferences in the following areas: preferred industries, value or growth stocks, dividend or non-dividend stocks, and cyclical or non-cyclical stocks. Engage the client in conversation, addressing each topic one by one. Start the conversation by asking about their preferred industry first.
+Keep responses concise (AT MOST EIGHTY WORDS). If needed, longer responses are acceptable, but aim to be brief. Avoid discussing topics outside of these preferences. The purpose of this stage is to understand the customers’ investment preferences. Please avoid discussing specific stocks during this process. If the client tries to shift the focus, remind them that specific stock details will be covered in the next round, and this session is solely about preferences. If they are unfamiliar with any financial concepts, provide clear explanations to assist them.
+Once you’ve gathered all the information, say: *“Thank you for the conversation, please move on to the next section.”*

_static/txt/system_instruction_preference_elicitation_personality.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+You are a professional financial advisor discussing individual stocks with a customer. {personality} Emphasize the personality in the conversation. Do not include any expressions in parentheses such as pauses, hesitations, or physical actions. The dialogue should focus purely on the verbal content of the conversation. Your goal is to understand their investment preferences in the following areas: preferred industries, value or growth stocks, dividend or non-dividend stocks, and cyclical or non-cyclical stocks. Engage the client in conversation, addressing each topic one by one. Start the conversation by asking about their preferred industry first.
+Keep responses concise (AT MOST EIGHTY WORDS). If needed, longer responses are acceptable, but aim to be brief. Avoid discussing topics outside of these preferences. The purpose of this stage is to understand the customers’ investment preferences. Please avoid discussing specific stocks during this process. If the client tries to shift the focus, remind them that specific stock details will be covered in the next round, and this session is solely about preferences. If they are unfamiliar with any financial concepts, provide clear explanations to assist them.
+Once you’ve gathered all the information, say: *“Thank you for the conversation, please move on to the next section.”*

_static/txt/system_summarization_user_preference_elicitation.txt ADDED Viewed

	@@ -0,0 +1 @@

+ You are a financial advisor. Summarize a previous conversation with a customer about their investment preferences in four areas: preferred industries, value vs. growth stocks, dividend vs. non-dividend stocks, and cyclical vs. non-cyclical stocks. If the customer has not expressed a preference in any of these areas, clearly indicate that the preference for that specific aspect has not been discussed. Keep the summary very simple, omitting any unnecessary details.

app.py ADDED Viewed

	@@ -0,0 +1,1392 @@

+import sys
+import os
+from datetime import datetime
+import json
+import uuid
+from pathlib import Path
+from huggingface_hub import CommitScheduler, login
+from datasets import load_dataset
+import gradio as gr
+import markdown
+from together import Together
+ROOT_FILE = os.path.join(os.path.dirname(os.path.abspath(__file__)), "./")
+sys.path.append(ROOT_FILE)
+from components.induce_personality import construct_big_five_words
+from components.chat_conversation import (
+    # format_message_history,
+    format_user_message,
+    format_context,
+    gradio_to_huggingface_message,
+    huggingface_to_gradio_message,
+    # get_system_instruction,
+    prepare_tokenizer,
+    # format_rag_context,
+    conversation_window,
+    generate_response_local_api,
+    generate_response_together_api,
+    generate_response_debugging,
+)
+from components.constant import (
+    CONV_WINDOW,
+    API_URL,
+)
+from components.induce_personality import (
+    build_personality_prompt,
+)
# Directory for API logs; it is created at import time if it is missing.
LOG_DIR = os.path.join(ROOT_FILE, "log/api/")
if not os.path.exists(LOG_DIR):
    os.makedirs(LOG_DIR)

# Load Static Files
STATIC_FILE = os.path.join(ROOT_FILE, "_static")
# NOTE: LOG_DIR is rebound here. From this point on the name refers to
# log/test_session/, not to the log/api/ directory created above.
LOG_DIR = os.path.join(ROOT_FILE, "log/test_session/")

# HTML pages shown to the participant.
INSTRUCTION_PAGE_FILE = os.path.join(STATIC_FILE, "html/instruction_page.html")
USER_NARRATIVE_FILE = os.path.join(STATIC_FILE, "html/user_narrative.html")
PREFERENCE_ELICITATION_TASK_FILE = os.path.join(STATIC_FILE, "html/system_instruction_preference_elicitation.html")
EVALUATION_INSTRUCTION_FILE = os.path.join(STATIC_FILE, "html/evaluation_instruction.html")
GENERAL_INSTRUCTION_FILE = os.path.join(STATIC_FILE, "html/general_instruction.html")
FINAL_EVALUATION_FILE = os.path.join(STATIC_FILE, "html/final_evaluation.html")

# Plain-text system prompts and personality descriptions.
SYSTEM_INSTRUCTION_PERSONALIZATION_FILE = os.path.join(STATIC_FILE, "txt/system_instruction_personalization.txt")
SYSTEM_INSTRUCTION_NON_PERSONALIZATION_FILE = os.path.join(
    STATIC_FILE, "txt/system_instruction_non_personalization.txt"
)
SYSTEM_INSTRUCTION_PERSONALITY_FILE = os.path.join(STATIC_FILE, "txt/system_instruction_personality.txt")
SYSTEM_INSTRUCTION_PREFERENCE_ELICITATION_FILE = os.path.join(
    STATIC_FILE, "txt/system_instruction_preference_elicitation.txt"
)
SYSTEM_INSTRUCTION_PREFERENCE_ELICITATION_PERSONALITY_FILE = os.path.join(
    STATIC_FILE, "txt/system_instruction_preference_elicitation_personality.txt"
)
SUMMARIZATION_PROMPT_FILE = os.path.join(STATIC_FILE, "txt/system_summarization_user_preference_elicitation.txt")
PERSONALITY_EXT_FILE = os.path.join(STATIC_FILE, "txt/personality_ext.txt")
PERSONALITY_INT_FILE = os.path.join(STATIC_FILE, "txt/personality_int.txt")

# One UUID per process; it is embedded in every feedback file name below.
uuid_this_session = str(uuid.uuid4())
system_order = "first"
feedback_dir = Path("user_feedback_debug/")
feedback_file_interaction = feedback_dir / f"interaction_{uuid_this_session}_{system_order}.json"
feedback_file_summarization = feedback_dir / f"summarization_{uuid_this_session}_{system_order}.json"
feedback_file_round_evaluation = feedback_dir / f"round_evaluation_{uuid_this_session}_{system_order}.json"
feedback_file_final_ranking = feedback_dir / f"final_ranking_{uuid_this_session}_{system_order}.json"
feedback_file_final_survey = feedback_dir / f"final_survey_{uuid_this_session}_{system_order}.json"
feedback_folder = feedback_file_interaction.parent
feedback_folder.mkdir(parents=True, exist_ok=True)  # Ensure the directory exists

# Uploads the feedback folder to the dataset repo named by the LOGGING_FILE
# environment variable. NOTE(review): `every` is presumably the commit interval
# in minutes - confirm against the huggingface_hub documentation.
scheduler = CommitScheduler(
    repo_id=os.getenv("LOGGING_FILE"),
    repo_type="dataset",
    folder_path=feedback_folder,
    path_in_repo="data",
    token=os.getenv("HUGGINGFACE_HUB_TOKEN"),
    every=1,
)
# Function to save user feedback
def save_feedback(user_id: str, uuid: str, type: str, value, feedback_file) -> None:
    """
    Append one feedback record to ``feedback_file`` as a single JSON line.

    The record holds ``user_id``, ``uuid``, a ``timestamp`` formatted as
    ``YYYY-MM-DD HH:MM:SS`` (local time of ``datetime.now()``), ``type`` and
    ``value``. The write happens while holding ``scheduler.lock``.

    Args:
        user_id: Identifier of the participant.
        uuid: Session identifier stored alongside the record.
        type: Label describing what kind of feedback this is.
        value: JSON-serializable payload.
        feedback_file: Path-like object exposing ``open`` (e.g. ``pathlib.Path``).
    """
    record = {
        "user_id": user_id,
        "uuid": uuid,
        "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M:%S"),
        "type": type,
        "value": value,
    }
    # Serialize inside the locked/open section, exactly where the original did.
    with scheduler.lock, feedback_file.open("a") as f:
        f.write(json.dumps(record))
        f.write("\n")
# Load the required static content from files
def load_static_content(file_path):
    """Return the entire text of ``file_path``, decoded as UTF-8.

    The encoding is passed explicitly because the static prompt/HTML files
    contain non-ASCII characters (e.g. curly quotes); without it ``open`` falls
    back to the platform's locale encoding, which may not be UTF-8.

    Args:
        file_path: Path of the text file to read.

    Returns:
        The file content as a single string.
    """
    with open(file_path, "r", encoding="utf-8") as f:
        return f.read()
def ensure_directory_exists(directory_path):
    """Ensures the given directory exists; creates it (and parents) if it does not.

    ``exist_ok=True`` keeps the call from failing when another thread or
    process creates the directory between the existence check and
    ``os.makedirs``. The existence check is kept so that an already existing
    path is still left untouched.

    Args:
        directory_path: Path of the directory to create.
    """
    if not os.path.exists(directory_path):
        os.makedirs(directory_path, exist_ok=True)
# Static HTML pages and prompt templates, read once at import time.
INSTRUCTION_PAGE = load_static_content(INSTRUCTION_PAGE_FILE)
EVALUATION_INSTRUCTION = load_static_content(EVALUATION_INSTRUCTION_FILE)
GENERAL_INSTRUCTION = load_static_content(GENERAL_INSTRUCTION_FILE)
USER_NARRATIVE = load_static_content(USER_NARRATIVE_FILE)
PREFERENCE_ELICITATION_TASK = load_static_content(PREFERENCE_ELICITATION_TASK_FILE)
FINAL_EVALUATION = load_static_content(FINAL_EVALUATION_FILE)
SYSTEM_INSTRUCTION_PERSONALIZATION = load_static_content(SYSTEM_INSTRUCTION_PERSONALIZATION_FILE)
SYSTEM_INSTRUCTION_NON_PERSONALIZATION = load_static_content(SYSTEM_INSTRUCTION_NON_PERSONALIZATION_FILE)
SYSTEM_INSTRUCTION_PERSONALITY = load_static_content(SYSTEM_INSTRUCTION_PERSONALITY_FILE)
SYSTEM_INSTRUCTION_PREFERENCE_ELICITATION = load_static_content(SYSTEM_INSTRUCTION_PREFERENCE_ELICITATION_FILE)
SYSTEM_INSTRUCTION_PREFERENCE_ELICITATION_PERSONALITY = load_static_content(
    SYSTEM_INSTRUCTION_PREFERENCE_ELICITATION_PERSONALITY_FILE
)
SUMMARIZATION_PROMPT = load_static_content(SUMMARIZATION_PROMPT_FILE)
PERSONALITY_EXT = load_static_content(PERSONALITY_EXT_FILE)
PERSONALITY_INT = load_static_content(PERSONALITY_INT_FILE)
# Other constants
FIRST_MESSAGE = "Hey"
USER_PREFERENCE_SUMMARY = True
DEBUG = False
# Backend used to generate responses: "together", "local" or "debug".
API_TYPE = "together"
# The message now lists every accepted value (it previously omitted 'debug').
assert API_TYPE in ["together", "local", "debug"], "The API should be one of 'together', 'local' or 'debug'"
# TOGETHER_CLIENT is only defined when the Together backend is selected.
if API_TYPE == "together":
    TOGETHER_CLIENT = Together(api_key=os.getenv("TOGETHER_API_KEY"))
def generate_username_pwd_list(data):
    """Build (name, password) pairs for regular and demo accounts.

    Args:
        data: Table exposing ``iterrows()`` whose rows have the keys
            ``"user"``, ``"demo"`` and ``"pwd"`` (a pandas DataFrame in the caller).

    Returns:
        A tuple ``(user_list, demo_list)``; each is a list of
        ``(name, str(password))`` tuples in row order.
    """
    rows = [row for _, row in data.iterrows()]
    user_list = [(row["user"], str(row["pwd"])) for row in rows]
    demo_list = [(row["demo"], str(row["pwd"])) for row in rows]
    return user_list, demo_list
def load_username_and_pwd():
    """Log in to the Hugging Face Hub and load the account credentials.

    Reads the token from the ``HUGGINGFACE_HUB_TOKEN`` environment variable
    (a missing variable raises ``KeyError``) and the dataset name from
    ``USER_PWD_FILE``. The ``train`` split is converted to a pandas DataFrame
    and handed to ``generate_username_pwd_list``.

    Returns:
        The ``(user_list, demo_list)`` tuple built from the dataset.
    """
    login(token=os.environ["HUGGINGFACE_HUB_TOKEN"])
    credentials = load_dataset(os.getenv("USER_PWD_FILE"))["train"].to_pandas()
    users, demos = generate_username_pwd_list(credentials)
    return users, demos
def get_context_list(synthetic_data_path):
    """Load a JSON Lines file into a list of parsed objects.

    The file is decoded as UTF-8 regardless of the platform locale, and
    blank or whitespace-only lines (such as a trailing empty line) are skipped
    instead of crashing ``json.loads``.

    Args:
        synthetic_data_path: Path of the ``.jsonl`` file.

    Returns:
        One parsed object per non-blank line, in file order.

    Raises:
        json.JSONDecodeError: If a non-blank line is not valid JSON.
    """
    # Load data from the synthetic data file
    with open(synthetic_data_path, "r", encoding="utf-8") as f:
        return [json.loads(line) for line in f if line.strip()]
def add_ticker_prefix(ticker_list, context_list):
    """Prefix each context with its ticker as ``"<ticker>: <context>"``.

    The two sequences are paired positionally with ``zip``, so the result is
    as long as the shorter input.
    """
    return [f"{symbol}: {text}" for symbol, text in zip(ticker_list, context_list)]
def build_raw_context_list(context_dict):
    """Return the unprocessed entries stored under the ``"data"`` key."""
    raw_entries = context_dict["data"]
    return raw_entries
def build_context(context_dict):
    """Render every entry under ``context_dict["data"]`` with ``build_context_element``.

    Returns:
        A list of rendered context strings, in the order of the entries.
    """
    rendered = []
    for entry in context_dict["data"]:
        rendered.append(build_context_element(entry))
    return rendered
def build_context_element(context):
    """Render one stock record as the text block given to the advisor model.

    Args:
        context: Mapping with the keys ``ticker``, ``sector``,
            ``business_summary``, ``short_name``, ``price_data``,
            ``earning_summary`` and ``beta``.

    Returns:
        A two-part string: a ``Stock Candidate`` line followed by the
        ``Stock Information`` section.

    Raises:
        KeyError: If any of the keys above is missing.
    """
    # Fields are read in a fixed order so a missing key fails on the same field.
    _ = context["ticker"]  # required to be present, but not part of the rendered text
    sector = context["sector"]
    business_summary = context["business_summary"]
    name = context["short_name"]
    stock_price = context["price_data"]
    earning = context["earning_summary"]
    beta = context["beta"]

    header = f"Stock Candidate: {name}"
    details = f"Stock Information: \nIndustry - {sector}, \nBeta (risk indicator) - {beta}, \nEarning Summary - {earning}\n, 2023 Monthly Stock Price - {stock_price}\n, Business Summary - {business_summary}"
    # Combine both parts into a single newline-separated string
    return header + "\n" + details
def get_user_narrative_html(user_narrative):
    """Fill the ``USER_NARRATIVE`` template and convert newlines to ``<br>``.

    The ``{user_narrative}`` placeholder is substituted first; afterwards every
    newline in the whole result (template and narrative alike) becomes ``<br>``.
    """
    filled_template = USER_NARRATIVE.replace("{user_narrative}", user_narrative)
    return filled_template.replace("\n", "<br>")
def get_user_narrative_from_raw(raw_narrative):
    """Convert a raw narrative to HTML and embed it in the narrative template.

    Newlines are replaced with ``<br>`` before the text is passed through
    ``markdown.markdown``; the result is then handed to
    ``get_user_narrative_html``.
    """
    with_line_breaks = raw_narrative.replace("\n", "<br>")
    narrative_html = markdown.markdown(with_line_breaks)
    return get_user_narrative_html(narrative_html)
def get_task_instruction_for_user(context):
    """Build the instruction HTML shown for one stock round.

    Args:
        context: Mapping providing ``short_name`` (the stock's display name)
            and ``user_narrative`` (narrative text for this round).

    Returns:
        A tuple ``(general_instruction, round_instruction)``: the shared
        ``GENERAL_INSTRUCTION`` HTML and a round-specific HTML card containing
        the stock name and the narrative rendered through ``markdown``.
    """
    ticker_name = context["short_name"]
    # Newlines become <br> before the Markdown conversion.
    html_user_narrative = markdown.markdown(context["user_narrative"].replace("\n", "<br>"))
    round_instruction = f"""
<div style="background-color: #f9f9f9; padding: 20px; border-radius: 10px; box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1); margin-bottom: 20px; max-height: 780px; overflow-y: auto; overflow-x: hidden;">
    <!-- Stock Information (Bold label, Normal ticker name) -->
    <h2 style="color: #2c3e50; text-align: center; margin-bottom: 20px; font-size: 20px; font-weight: 600;">
        Round Info
    </h2>
    <div style="text-align: left; font-size: 20px; font-weight: bold; margin-bottom: 20px;">
        Stock
    </div>
    <div style="text-align: left; font-weight: normal; font-size: 16px; margin-bottom: 20px;">
        <span style="font-weight: bold;">
            This Round's Stock:
        </span>
        {ticker_name}
    </div>
    <!-- User Narrative (Bold label, Normal narrative) -->
    <div style="text-align: left; font-size: 20px; font-weight: bold; margin-bottom: 20px;">
        User Narrative
    </div>
    <div style="text-align: left; font-weight: normal; font-size: 16px; margin-bottom: 20px;">
        {html_user_narrative}
    </div>
</div>"""
    return GENERAL_INSTRUCTION, round_instruction
def display_system_instruction_with_html(
    system_instruction,
):
    """Wrap ``system_instruction`` in a left-aligned ``<p>`` element.

    The surrounding whitespace and newlines of the returned snippet are part
    of the output and are kept exactly as in the template.
    """
    return (
        "\n"
        '        <p style="text-align: left; margin-bottom: 10px;">\n'
        f"            {system_instruction}\n"
        "        </p>\n"
        "    "
    )
def log_action(user_id, tab_name, action, details):
    """
    Append one action line to the per-user, per-tab log file.

    The file lives at ``LOG_DIR/<user_id>/<tab_name>.txt``; the user directory
    is created when it does not exist yet. Each call appends a line of the form
    ``Action: <action> | Details: <details>``.
    """
    user_log_dir = os.path.join(LOG_DIR, f"{user_id}")
    if not os.path.exists(user_log_dir):
        os.makedirs(user_log_dir)
    with open(os.path.join(user_log_dir, f"{tab_name}.txt"), "a") as f:
        f.write(f"Action: {action} | Details: {details}\n")
def add_user_profile_to_system_instruction(
    user_id, system_instruction, user_preference_elicitation_data, summary, terminator
):
    """Append the user's elicited profile to ``system_instruction``.

    Args:
        user_id: Underscore-separated identifier; its third-from-last field is
            parsed as the integer experiment id.
        system_instruction: Base system prompt text.
        user_preference_elicitation_data: Dict with ``"history"`` and
            ``"summary_history"`` entries; ``"summary_history"`` is filled in
            here the first time a summary is generated.
        summary: When truthy, a model-written summary of the history is
            appended; otherwise the raw history is appended.
        terminator: Passed through to the local API backend only.

    Returns:
        ``system_instruction`` unchanged when the experiment id is 1, otherwise
        the instruction with a "User Profile ..." section appended.
    """
    # exp_id = 1 => No personalization
    if int(user_id.split("_")[-3]) == 1:
        return system_instruction

    if not summary:
        return system_instruction + (
            f"\nUser Profile collected in the previous conversations: {user_preference_elicitation_data['history']}\n"
        )

    # Summarize only once; later calls reuse the cached summary.
    if user_preference_elicitation_data["summary_history"] == "":
        # Format prompt
        history = user_preference_elicitation_data["history"]
        summarization_prompt = SUMMARIZATION_PROMPT + f"\nPrevious Conversations: {history}"
        summarization_instruction = [{"role": "system", "content": summarization_prompt}]
        if API_TYPE == "local":
            summ, _ = generate_response_local_api(summarization_instruction, terminator, 512, API_URL)
        elif API_TYPE == "together":
            summ, _ = generate_response_together_api(summarization_instruction, 512, TOGETHER_CLIENT)
        else:
            summ, _ = generate_response_debugging(summarization_instruction)
        user_preference_elicitation_data["summary_history"] = summ
        save_feedback(
            user_id,
            uuid_this_session,
            "preference_elicitation_summarization",
            {"summarization": summ},
            feedback_file_summarization,
        )
    return system_instruction + (
        f"\nUser Profile collected in the previous conversations: {user_preference_elicitation_data['summary_history']}\n"
    )
def likert_evaluation(content):
    """Create a 1-7 radio group whose visible label is ``content``."""
    scale = list(range(1, 8))  # [1, 2, 3, 4, 5, 6, 7]
    return gr.Radio(scale, label=f"{content}", show_label=True)
def reorder_list_based_on_user_in_narrative_id(user_in_narrative_id, target_list):
    """Return ``target_list`` permuted by the fixed order assigned to the id.

    Args:
        user_in_narrative_id: One of the string keys ``"0"`` to ``"4"``.
        target_list: Indexable sequence with at least four elements.

    Returns:
        A new four-element list holding the items of ``target_list`` in the
        order defined for ``user_in_narrative_id``.

    Raises:
        KeyError: If ``user_in_narrative_id`` is not a known key.
    """
    # Fixed index permutations, one per narrative id.
    permutations = {
        "0": [3, 2, 1, 0],
        "1": [1, 0, 3, 2],
        "2": [2, 1, 0, 3],
        "3": [1, 3, 2, 0],
        "4": [0, 3, 1, 2],
    }
    reordered = []
    for position in permutations[user_in_narrative_id]:
        reordered.append(target_list[position])
    return reordered
+def create_demo():
+    global context_info_list, terminator
+    def tab_creation_exploration_stage(order, comp, context):
+        english_order = ["1", "2", "3", "4", "5"]
+        with gr.Tab(f"{english_order[order]}-1:Discuss"):
+            general_instruction = gr.HTML(label="General Instruction")
+            with gr.Row():
+                with gr.Column():
+                    with gr.Row():
+                        round_instruction = gr.HTML(label="Round Instruction")
+                with gr.Column():
+                    with gr.Row():
+                        chatbot = gr.Chatbot(height=600)
+                    with gr.Row():
+                        start_conversation = gr.Button(value="Start Conversation")
+                    with gr.Row():
+                        msg = gr.Textbox(scale=1, label="User Input")
+                    with gr.Row():
+                        msg_button = gr.Button(value="Send This Message to Advisor", interactive=False)
+                        continue_button = gr.Button(value="Show More of the Advisor’s Answer", interactive=False)
+            with gr.Row():
+                clear = gr.ClearButton([msg, chatbot])
+        with gr.Tab(f"{english_order[order]}-2:Eval"):
+            with gr.Row():
+                gr.HTML(value=EVALUATION_INSTRUCTION)
+            with gr.Row():
+                likelihood = gr.Radio(
+                    [1, 2, 3, 4, 5, 6, 7],
+                    label="I am likely to purchase the stock (1 = Strongly Disagree, 7 = Strongly Agree)",
+                    show_label=True,
+                )
+                reason = gr.Textbox(
+                    scale=1,
+                    label="Reason for Your Choice (Explain Your Reasoning & Highlight Useful Parts of Conversation)",
+                    lines=5,
+                )
+            with gr.Row():
+                confidence = gr.Radio(
+                    [1, 2, 3, 4, 5, 6, 7],
+                    label="I am confident in my decision (1 = Strongly Disagree, 7 = Strongly Agree)",
+                    show_label=True,
+                )
+                familiarity = gr.Radio(
+                    [1, 2, 3, 4, 5, 6, 7],
+                    label="What was your level of familiarity with the candidate stock before the interaction? (1 = Not Familiar, 7 = Very Familiar)",
+                )
+            with gr.Row():
+                textbox = gr.HTML()
+                evaluation_send_button = gr.Button(value="Send: Evaluation")
+        return {
+            "comp": comp,
+            "system_instruction_context": context,
+            "start_conversation": start_conversation,
+            "msg_button": msg_button,
+            "continue_button": continue_button,
+            "chatbot": chatbot,
+            "msg": msg,
+            "reason": reason,
+            "likelihood": likelihood,
+            "confidence": confidence,
+            "familiarity": familiarity,
+            "evaluation_send_button": evaluation_send_button,
+            "general_instruction": general_instruction,
+            "round_instruction": round_instruction,
+            "textbox": textbox,
+        }
+    def tab_creation_preference_stage():
+        with gr.Row():
+            gr.HTML(value=PREFERENCE_ELICITATION_TASK, label="Preference Elicitation Task")
+        with gr.Row():
+            with gr.Column():
+                user_narrative = gr.HTML(label="User Narrative")
+            with gr.Column():
+                with gr.Row():
+                    elicitation_chatbot = gr.Chatbot(height=600)
+                with gr.Row():
+                    start_conversation = gr.Button(value="Start Conversation")
+                with gr.Row():
+                    msg = gr.Textbox(scale=1, label="User Input")
+                with gr.Row():
+                    msg_button = gr.Button(value="Send This Message to Advisor", interactive=False)
+                    continue_button = gr.Button(value="Show More of the Advisor’s Answer", interactive=False)
+        return {
+            "start_conversation": start_conversation,
+            "msg_button": msg_button,
+            "continue_button": continue_button,
+            "msg": msg,
+            "elicitation_chatbot": elicitation_chatbot,
+            "user_narrative": user_narrative,
+        }
+    def tab_final_evaluation():
+        with gr.Row():
+            gr.HTML(value=FINAL_EVALUATION)
+        with gr.Row():
+            gr.HTML(value="<h3>Rank the individual stocks below according to your desire to invest in each one.</h3>")
+        with gr.Row():
+            ranking_first_comp = gr.Dropdown(choices=[1, 2, 3, 4])
+            ranking_second_comp = gr.Dropdown(choices=[1, 2, 3, 4])
+            ranking_third_comp = gr.Dropdown(choices=[1, 2, 3, 4])
+            ranking_fourth_comp = gr.Dropdown(choices=[1, 2, 3, 4])
+        with gr.Row():
+            gr.HTML(
+                value='<h3>Choose how strongly you agree with each statement about the advisor (<strong style="color:red;">1 for Strongly Disagree</strong>, <strong style="color:green;">7 for Strongly Agree</strong>).</h3>'
+            )
+        with gr.Row():
+            perceived_personalization = likert_evaluation("The advisor understands my needs")
+            emotional_trust = likert_evaluation("I feel content about relying on this advisor for my decisions")
+        with gr.Row():
+            trust_in_competence = likert_evaluation("The advisor has good knowledge of the stock")
+            intention_to_use = likert_evaluation(
+                "I am willing to use this advisor as an aid to help with my decision about which stock to purchase"
+            )
+        with gr.Row():
+            usefulness = likert_evaluation("The advisor gave me good suggestions")
+            overall_satisfaction = likert_evaluation("Overall, I am satisfied with the advisor")
+        with gr.Row():
+            providing_information = likert_evaluation("The advisor provides the financial knowledge needed")
+        with gr.Row():
+            textbox = gr.HTML()
+            submit_ranking = gr.Button(value="Submit Final Evaluation")
+        return {
+            "first": ranking_first_comp,
+            "second": ranking_second_comp,
+            "third": ranking_third_comp,
+            "fourth": ranking_fourth_comp,
+            "evaluators": {
+                "perceived_personalization": perceived_personalization,
+                "emotional_trust": emotional_trust,
+                "trust_in_competence": trust_in_competence,
+                "intention_to_use": intention_to_use,
+                "usefulness": usefulness,
+                "overall_satisfaction": overall_satisfaction,
+                "providing_information": providing_information,
+            },
+            "submit_ranking": submit_ranking,
+            "text_box": textbox,
+        }
+    def click_control_exploration_stage(
+        tabs, user_id, tab_session, user_preference_elicitation_session, system_description_without_context
+    ):
+        (
+            comp,
+            system_instruction_context,
+            start_conversation,
+            msg_button,
+            continue_button,
+            chatbot,
+            msg,
+            reason,
+            likelihood,
+            confidence,
+            familiarity,
+            evaluation_send_button,
+            textbox,
+        ) = (
+            tabs["comp"],
+            tabs["system_instruction_context"],
+            tabs["start_conversation"],
+            tabs["msg_button"],
+            tabs["continue_button"],
+            tabs["chatbot"],
+            tabs["msg"],
+            tabs["reason"],
+            tabs["likelihood"],
+            tabs["confidence"],
+            tabs["familiarity"],
+            tabs["evaluation_send_button"],
+            tabs["textbox"],
+        )
+        system_instruction = ""
+        start_conversation.click(
+            lambda user_id, tab_session, history, comp, user_preference_elicitation_session, system_description_without_context, system_instruction_context: respond_start_conversation(
+                user_id,
+                tab_session,
+                history,
+                system_instruction,
+                comp,
+                user_preference_elicitation_data=user_preference_elicitation_session,
+                system_description_without_context=system_description_without_context,
+                system_instruction_context=system_instruction_context,
+            ),
+            [
+                user_id,
+                tab_session,
+                chatbot,
+                comp,
+                user_preference_elicitation_session,
+                system_description_without_context,
+                system_instruction_context,
+            ],
+            [tab_session, chatbot, start_conversation, msg_button, continue_button],
+        )
+        msg_button.click(
+            lambda user_id, tab_session, message, history, comp, user_preference_elicitation_session, system_description_without_context, system_instruction_context: respond(
+                user_id,
+                tab_session,
+                message,
+                tab_session["history"],
+                system_instruction,
+                comp,
+                user_preference_elicitation_data=user_preference_elicitation_session,
+                system_description_without_context=system_description_without_context,
+                system_instruction_context=system_instruction_context,
+            ),
+            [
+                user_id,
+                tab_session,
+                msg,
+                chatbot,
+                comp,
+                user_preference_elicitation_session,
+                system_description_without_context,
+                system_instruction_context,
+            ],
+            [tab_session, msg, chatbot],
+        )
+        continue_button.click(
+            lambda user_id, tab_session, history, comp, user_preference_elicitation_session, system_description_without_context, system_instruction_context: respond_continue(
+                user_id,
+                tab_session,
+                tab_session["history"],
+                system_instruction,
+                comp,
+                user_preference_elicitation_data=user_preference_elicitation_session,
+                system_description_without_context=system_description_without_context,
+                system_instruction_context=system_instruction_context,
+            ),
+            [
+                user_id,
+                tab_session,
+                chatbot,
+                comp,
+                user_preference_elicitation_session,
+                system_description_without_context,
+                system_instruction_context,
+            ],
+            [tab_session, chatbot],
+        )
+        evaluation_send_button.click(
+            lambda user_id, comp, tab_session, reason, likelihood, confidence, familiarity, evaluation_send_button, textbox: respond_evaluation(
+                user_id,
+                tab_session,
+                {
+                    "reason": reason,
+                    "likelihood": likelihood,
+                    "confidence": confidence,
+                    "familiarity": familiarity,
+                },
+                comp,
+                evaluation_send_button,
+                textbox,
+            ),
+            [
+                user_id,
+                comp,
+                tab_session,
+                reason,
+                likelihood,
+                confidence,
+                familiarity,
+                evaluation_send_button,
+                textbox,
+            ],
+            [tab_session, reason, likelihood, confidence, familiarity, evaluation_send_button, textbox],
+        )
+    def click_control_preference_stage(
+        tabs, user_id, user_preference_elicitation_session, system_description_user_elicitation
+    ):
+        (
+            start_conversation,
+            msg_button,
+            continue_button,
+            elicitation_chatbot,
+            msg,
+        ) = (
+            tabs["start_conversation"],
+            tabs["msg_button"],
+            tabs["continue_button"],
+            tabs["elicitation_chatbot"],
+            tabs["msg"],
+        )
+        # nonlocal user_id
+        start_conversation.click(
+            lambda user_id, user_preference_elicitation_data, history, system_description_user_elicitation: respond_start_conversation(
+                user_id,
+                user_preference_elicitation_data,
+                history,
+                system_description_user_elicitation,
+                user_elicitation=True,
+            ),
+            [user_id, user_preference_elicitation_session, elicitation_chatbot, system_description_user_elicitation],
+            [user_preference_elicitation_session, elicitation_chatbot, start_conversation, msg_button, continue_button],
+        )
+        msg_button.click(
+            lambda user_id, tab_data, message, history, system_description_user_elicitation: respond(
+                user_id,
+                tab_data,
+                message,
+                tab_data["history"],
+                system_description_user_elicitation,
+                user_elicitation=True,
+            ),
+            [
+                user_id,
+                user_preference_elicitation_session,
+                msg,
+                elicitation_chatbot,
+                system_description_user_elicitation,
+            ],
+            [user_preference_elicitation_session, msg, elicitation_chatbot],
+        )
+        continue_button.click(
+            lambda user_id, tab_data, history, system_description_user_elicitation: respond_continue(
+                user_id,
+                tab_data,
+                tab_data["history"],
+                system_description_user_elicitation,
+                user_elicitation=True,
+            ),
+            [user_id, user_preference_elicitation_session, elicitation_chatbot, system_description_user_elicitation],
+            [user_preference_elicitation_session, elicitation_chatbot],
+        )
+    def click_control_final_evaluation(tabs, user_id, first_comp, second_comp, third_comp, fourth_comp, evaluators):
+        (
+            ranking_first_comp,
+            ranking_second_comp,
+            ranking_third_comp,
+            ranking_fourth_comp,
+        ) = (
+            tabs["first"],
+            tabs["second"],
+            tabs["third"],
+            tabs["fourth"],
+        )
+        (
+            perceived_personalization,
+            emotional_trust,
+            trust_in_competence,
+            intention_to_use,
+            usefulness,
+            overall_satisfaction,
+            providing_information,
+        ) = (
+            evaluators["perceived_personalization"],
+            evaluators["emotional_trust"],
+            evaluators["trust_in_competence"],
+            evaluators["intention_to_use"],
+            evaluators["usefulness"],
+            evaluators["overall_satisfaction"],
+            evaluators["providing_information"],
+        )
+        result_textbox = tabs["text_box"]
+        submit_ranking = tabs["submit_ranking"]
+        submit_ranking.click(
+            lambda user_id, first_comp, ranking_first_comp, second_comp, ranking_second_comp, third_comp, ranking_third_comp, fourth_comp, ranking_fourth_comp, perceived_personalization, emotional_trust, trust_in_competence, intention_to_use, usefulness, overall_satisfaction, providing_information, submit_ranking: respond_final_ranking(
+                user_id,
+                first_comp,
+                ranking_first_comp,
+                second_comp,
+                ranking_second_comp,
+                third_comp,
+                ranking_third_comp,
+                fourth_comp,
+                ranking_fourth_comp,
+                perceived_personalization,
+                emotional_trust,
+                trust_in_competence,
+                intention_to_use,
+                usefulness,
+                overall_satisfaction,
+                providing_information,
+                submit_ranking,
+            ),
+            # Input components (names and rankings)
+            [
+                user_id,
+                first_comp,
+                ranking_first_comp,
+                second_comp,
+                ranking_second_comp,
+                third_comp,
+                ranking_third_comp,
+                fourth_comp,
+                ranking_fourth_comp,
+                perceived_personalization,
+                emotional_trust,
+                trust_in_competence,
+                intention_to_use,
+                usefulness,
+                overall_satisfaction,
+                providing_information,
+                submit_ranking,
+            ],
+            # Output component(s) where you want the result to appear, e.g., result_textbox
+            [result_textbox, submit_ranking],
+        )
+    def respond(
+        user_id,
+        tab_data,
+        message,
+        history,
+        system_instruction,
+        tab_name=None,
+        user_elicitation=False,
+        user_preference_elicitation_data=None,
+        system_description_without_context=None,
+        system_instruction_context=None,
+    ):
+        """
+        Return:
+        msg
+        chat_history
+        retrieved_passage
+        rewritten_query
+        """
+        assert (
+            tab_name is not None or user_elicitation is True
+        ), "Tab name is required for the start of the conversation unless it is not preference elicitation."
+        # Add user profile to system instruction
+        if system_description_without_context is not None and system_instruction_context is not None:
+            system_instruction = system_description_without_context + "\n" + system_instruction_context
+        if not user_elicitation:
+            system_instruction = add_user_profile_to_system_instruction(
+                user_id,
+                system_instruction,
+                user_preference_elicitation_data,
+                summary=USER_PREFERENCE_SUMMARY,
+                terminator=terminator,
+            )
+        # From string to list [{"role":"user", "content": message}, ...]
+        history = gradio_to_huggingface_message(history)
+        # We can implement context window here as we need all the system interaction. We can cut some of the early interactions if needed.
+        history = conversation_window(history, CONV_WINDOW)
+        # Add system instruction to the history
+        history = format_context(system_instruction, history)
+        # Add user message to the history
+        history_with_user_utterance = format_user_message(message, history)
+        # Call API instead of locally handle it
+        if API_TYPE == "local":
+            outputs_text, history = generate_response_local_api(history_with_user_utterance, terminator, 128, API_URL)
+        elif API_TYPE == "together":
+            outputs_text, history = generate_response_together_api(history_with_user_utterance, 128, TOGETHER_CLIENT)
+        else:
+            outputs_text, history = generate_response_debugging(history_with_user_utterance)
+        # exclude system interaction and store the others in the history
+        history = huggingface_to_gradio_message(history)
+        if tab_name is not None:
+            # Log the user message and response
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "interaction",
+                {"type": tab_name, "role": "user", "content": message},
+                feedback_file_interaction,
+            )
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "interaction",
+                {"type": tab_name, "role": "assistant", "content": outputs_text},
+                feedback_file_interaction,
+            )
+            # log_action(user_id, tab_name, "User Message", message)
+            # log_action(user_id, tab_name, "Response", outputs_text)
+            # Store the updated history for this tab
+            tab_data["history"] = history
+        if user_elicitation:
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "Interaction",
+                {"type": "user_elicitation", "role": "user", "content": message},
+                feedback_file_interaction,
+            )
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "Interaction",
+                {"type": "user_elicitation", "role": "assistant", "content": outputs_text},
+                feedback_file_interaction,
+            )
+            # log_action(user_id, "User_Elicitation", "User Message", message)
+            # log_action(user_id, "User_Elicitation", "Response", outputs_text)
+            tab_data["history"] = history
+        return tab_data, "", history
+    def respond_start_conversation(
+        user_id,
+        tab_data,
+        history,
+        system_instruction,
+        tab_name=None,
+        user_elicitation=False,
+        user_preference_elicitation_data=None,
+        system_description_without_context=None,
+        system_instruction_context=None,
+    ):
+        assert (
+            tab_name is not None or user_elicitation is True
+        ), "Tab name is required for the start of the conversation unless it is not preference elicitation."
+        if system_description_without_context is not None and system_instruction_context is not None:
+            system_instruction = system_description_without_context + "\n" + system_instruction_context
+        if not user_elicitation:
+            system_instruction = add_user_profile_to_system_instruction(
+                user_id,
+                system_instruction,
+                user_preference_elicitation_data,
+                summary=USER_PREFERENCE_SUMMARY,
+                terminator=terminator,
+            )
+        history = gradio_to_huggingface_message(history)
+        history = format_context(system_instruction, history)
+        first_message = FIRST_MESSAGE
+        history_with_user_utterance = format_user_message(first_message, history)
+        max_length = 128 if user_elicitation else 256
+        if API_TYPE == "local":
+            outputs_text, history = generate_response_local_api(
+                history_with_user_utterance, terminator, max_length, API_URL
+            )
+        elif API_TYPE == "together":
+            outputs_text, history = generate_response_together_api(
+                history_with_user_utterance, max_length, TOGETHER_CLIENT
+            )
+        else:
+            outputs_text, history = generate_response_debugging(history_with_user_utterance)
+        # Format
+        history = huggingface_to_gradio_message(history)
+        if tab_name is not None:
+            # Log the user message and response
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "interaction",
+                {"type": tab_name, "role": "user", "content": first_message},
+                feedback_file_interaction,
+            )
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "interaction",
+                {"type": tab_name, "role": "assistant", "content": outputs_text},
+                feedback_file_interaction,
+            )
+            # log_action(user_id, tab_name, "User Message", first_message)
+            # log_action(user_id, tab_name, "Response", outputs_text)
+            # Store the updated history for this tab
+            tab_data["history"] = history
+        if user_elicitation:
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "interaction",
+                {"type": "user_elicitation", "role": "user", "content": first_message},
+                feedback_file_interaction,
+            )
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "Interaction",
+                {"type": "user_elicitation", "role": "assistant", "content": outputs_text},
+                feedback_file_interaction,
+            )
+            tab_data["history"] = history
+        return (
+            tab_data,
+            history,
+            gr.Button(value="Start Conversation", interactive=False),
+            gr.Button(value="Send This Message to Advisor", interactive=True),
+            gr.Button(value="Show More of the Advisor’s Answer", interactive=True),
+        )
+    def respond_continue(
+        user_id,
+        tab_data,
+        history,
+        system_instruction,
+        tab_name=None,
+        user_elicitation=False,
+        user_preference_elicitation_data=None,
+        system_description_without_context=None,
+        system_instruction_context=None,
+    ):
+        assert (
+            tab_name is not None or user_elicitation is True
+        ), "Tab name is required for the start of the conversation."
+        # Add user profile to system instruction
+        if system_description_without_context is not None and system_instruction_context is not None:
+            system_instruction = system_description_without_context + "\n" + system_instruction_context
+        if not user_elicitation:
+            system_instruction = add_user_profile_to_system_instruction(
+                user_id,
+                system_instruction,
+                user_preference_elicitation_data,
+                summary=USER_PREFERENCE_SUMMARY,
+                terminator=terminator,
+            )
+        message = "continue"
+        history = gradio_to_huggingface_message(history)
+        history = conversation_window(history, CONV_WINDOW)
+        history = format_context(system_instruction, history)
+        history_with_user_utterance = format_user_message(message, history)
+        if API_TYPE == "local":
+            outputs_text, history = generate_response_local_api(history_with_user_utterance, terminator, 128, API_URL)
+        elif API_TYPE == "together":
+            outputs_text, history = generate_response_together_api(history_with_user_utterance, 128, TOGETHER_CLIENT)
+        else:
+            outputs_text, history = generate_response_debugging(history_with_user_utterance)
+        history = huggingface_to_gradio_message(history)
+        if tab_name is not None:
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "interaction",
+                {
+                    "type": tab_name,
+                    "role": "user",
+                    "content": message,
+                },
+                feedback_file_interaction,
+            )
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "interaction",
+                {"type": tab_name, "role": "assistant", "content": outputs_text},
+                feedback_file_interaction,
+            )
+            # Update history for this tab
+            tab_data["history"] = history
+        if user_elicitation:
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "interaction",
+                {"type": "user_elicitation", "role": "user", "content": message},
+                feedback_file_interaction,
+            )
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "interaction",
+                {"type": "user_elicitation", "role": "assistant", "content": outputs_text},
+                feedback_file_interaction,
+            )
+            tab_data["history"] = history
+        return tab_data, history
+    def respond_evaluation(user_id, tab_data, evals, tab_name, evaluation_send_button, textbox):
+        # dropdown, readon_button, multi-evaluator
+        if evals["likelihood"] is None or evals["confidence"] is None or evals["familiarity"] is None:
+            return (
+                tab_data,
+                evals["reason"],
+                evals["likelihood"],
+                evals["confidence"],
+                evals["familiarity"],
+                evaluation_send_button,
+                """<div style="background-color: #f8d7da; color: #721c24; padding: 15px; border: 1px solid #f5c6cb; border-radius: 5px; margin-bottom: 20px;">
+                    <strong>Please make sure that you answer all the questions.</strong>
+                    </div>""",
+            )
+        else:
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "round_evaluation",
+                {**evals, "company": tab_name},
+                feedback_file_round_evaluation,
+            )
+            # log_action(user_id, tab_name, "Round Evaluation", "Following")
+            # for key, value in evals.items():
+            #     log_action(user_id, tab_name, key, value)
+            # Store the reason for this tab
+            tab_data["multi_evaluator"] = evals
+            evaluation_send_button = gr.Button(value="Evaluation receirved", interactive=False)
+            return (
+                tab_data,
+                evals["reason"],
+                evals["likelihood"],
+                evals["confidence"],
+                evals["familiarity"],
+                evaluation_send_button,
+                """<div style="background-color: #d4edda; color: #155724; padding: 15px; border: 1px solid #c3e6cb; border-radius: 5px; margin-bottom: 20px;">
+                        <strong>Thank you for submitting your evaluation. You may proceed to the next tab.</strong>
+                    </div>""",
+            )
+    def respond_final_ranking(
+        user_id,
+        first_comp,
+        ranking_first_comp,
+        second_comp,
+        ranking_second_comp,
+        third_comp,
+        ranking_third_comp,
+        fourth_comp,
+        ranking_fourth_comp,
+        perceived_personalization,
+        emotional_trust,
+        trust_in_competence,
+        intention_to_use,
+        usefulness,
+        overall_satisfaction,
+        providing_information,
+        submit_ranking,
+    ):
+        # make sure that they are not the same
+        ranking_list = [
+            ranking_first_comp,
+            ranking_second_comp,
+            ranking_third_comp,
+            ranking_fourth_comp,
+        ]
+        if len(set(ranking_list)) != len(ranking_list):
+            return (
+                """<div style="background-color: #f8d7da; color: #721c24; padding: 15px; border: 1px solid #f5c6cb; border-radius: 5px; margin-bottom: 20px;">
+    <strong>Please make sure that you are not ranking the same stock multiple times.</strong>
+</div>""",
+                submit_ranking,
+            )
+        if any(
+            var is None
+            for var in [
+                perceived_personalization,
+                emotional_trust,
+                trust_in_competence,
+                intention_to_use,
+                usefulness,
+                overall_satisfaction,
+                providing_information,
+            ]
+        ):
+            return (
+                """<div style="background-color: #f8d7da; color: #721c24; padding: 15px; border: 1px solid #f5c6cb; border-radius: 5px; margin-bottom: 20px;">
+    <strong>Please make sure that you answer all the statements.</strong>
+</div>""",
+                submit_ranking,
+            )
+        else:
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "final_ranking",
+                {
+                    "comp_order": [first_comp, second_comp, third_comp, fourth_comp],
+                    "ranking": ranking_list,
+                },
+                feedback_file_final_ranking,
+            )
+            save_feedback(
+                user_id,
+                uuid_this_session,
+                "final_ranking_survey",
+                {
+                    "perceived_personalization": perceived_personalization,
+                    "emotional_trust": emotional_trust,
+                    "trust_in_competence": trust_in_competence,
+                    "intention_to_use": intention_to_use,
+                    "usefulness": usefulness,
+                    "overall_satisfaction": overall_satisfaction,
+                    "providing_information": providing_information,
+                },
+                feedback_file_final_survey,
+            )
+            submit_ranking = gr.Button(value="Final evaluaiotn received", interactive=False)
+            return (
+                """<div style="background-color: #d4edda; color: #155724; padding: 15px; border: 1px solid #c3e6cb; border-radius: 5px; margin-bottom: 20px;">
+                        <strong>Thank you for participating in the experiment. This concludes the session. You may now close the tab.</strong>
+                    </div>""",
+                submit_ranking,
+            )
+    def get_context(index, raw_context_list, stock_context_list):
+        comp = raw_context_list[index]["short_name"]
+        context = stock_context_list[index]
+        general_instruction, round_instruction = get_task_instruction_for_user(raw_context_list[index])
+        return comp, context, general_instruction, round_instruction
+    def set_user_id(request: gr.Request):
+        #  DEBUG
+        user_id = "user_0_0_0"
+        # user_id = request.username
+        user_in_narrative_id = user_id.split("_")[-1]
+        narrative_id = user_id.split("_")[-2]
+        experiment_id = user_id.split("_")[-3]
+        return user_id, user_in_narrative_id, narrative_id, experiment_id
+    def get_inst_without_context(experiment_id):
+        # experiment_id = 1 => personalization
+        # experiment_id = 2 => no personalization
+        # experiment_id == 3 => ext personality
+        # experiment_id == 4 => int personality
+        if experiment_id == "0":
+            return SYSTEM_INSTRUCTION_PERSONALIZATION
+        elif experiment_id == "1":
+            return SYSTEM_INSTRUCTION_NON_PERSONALIZATION
+        elif experiment_id == "2":
+            return SYSTEM_INSTRUCTION_PERSONALITY.format(personality=PERSONALITY_EXT)
+        elif experiment_id == "3":
+            return SYSTEM_INSTRUCTION_PERSONALITY.format(personality=PERSONALITY_INT)
+    def get_user_preference_elicitation(experiment_id):
+        if experiment_id == "0" or experiment_id == "1":
+            return SYSTEM_INSTRUCTION_PREFERENCE_ELICITATION
+        elif experiment_id == "2":
+            return SYSTEM_INSTRUCTION_PREFERENCE_ELICITATION_PERSONALITY.format(personality=PERSONALITY_EXT)
+        elif experiment_id == "3":
+            return SYSTEM_INSTRUCTION_PREFERENCE_ELICITATION_PERSONALITY.format(personality=PERSONALITY_INT)
+    def get_stock_related_context(narrative_id, user_in_narrative_id):
+        raw_context_list = build_raw_context_list(context_info_list[int(narrative_id)])
+        stock_context_list = build_context(context_info_list[int(narrative_id)])
+        raw_context_list = reorder_list_based_on_user_in_narrative_id(user_in_narrative_id, raw_context_list)
+        stock_context_list = reorder_list_based_on_user_in_narrative_id(user_in_narrative_id, stock_context_list)
+        return raw_context_list, stock_context_list
+    def set_initial_values(request: gr.Request):
+        # Set user specific information (Session State)
+        user_id, user_in_narrative_id, narrative_id, experiment_id = set_user_id(request)
+        # System instruction without prompt
+        system_description_without_context = get_inst_without_context(experiment_id)
+        # user_preference_elicitation
+        system_description_user_elicitation = get_user_preference_elicitation(experiment_id)
+        # Stock related context
+        raw_context_list, stock_context_list = get_stock_related_context(narrative_id, user_in_narrative_id)
+        # User Narrative
+        user_narrative = get_user_narrative_from_raw(raw_context_list[0]["user_narrative"])
+        # Tab Context
+        first_comp, first_context, first_general_instruction, first_round_instruction = get_context(
+            0, raw_context_list, stock_context_list
+        )
+        second_comp, second_context, second_general_instruction, second_round_instruction = get_context(
+            1, raw_context_list, stock_context_list
+        )
+        third_comp, third_context, third_general_instruction, third_round_instruction = get_context(
+            2, raw_context_list, stock_context_list
+        )
+        fourth_comp, fourth_context, fourth_general_instruction, fourth_round_instruction = get_context(
+            3, raw_context_list, stock_context_list
+        )
+        # Final Evaluation
+        ranking_first_comp = gr.Dropdown(choices=[1, 2, 3, 4], label=first_comp)
+        ranking_second_comp = gr.Dropdown(choices=[1, 2, 3, 4], label=second_comp)
+        ranking_third_comp = gr.Dropdown(choices=[1, 2, 3, 4], label=third_comp)
+        ranking_fourth_comp = gr.Dropdown(choices=[1, 2, 3, 4], label=fourth_comp)
+        return (
+            user_id,
+            user_in_narrative_id,
+            narrative_id,
+            experiment_id,
+            system_description_without_context,
+            system_description_user_elicitation,
+            raw_context_list,
+            stock_context_list,
+            user_narrative,
+            first_comp,
+            first_context,
+            first_general_instruction,
+            first_round_instruction,
+            second_comp,
+            second_context,
+            second_general_instruction,
+            second_round_instruction,
+            third_comp,
+            third_context,
+            third_general_instruction,
+            third_round_instruction,
+            fourth_comp,
+            fourth_context,
+            fourth_general_instruction,
+            fourth_round_instruction,
+            ranking_first_comp,
+            ranking_second_comp,
+            ranking_third_comp,
+            ranking_fourth_comp,
+        )
+    with gr.Blocks(title="RAG Chatbot Q&A", theme="Soft") as demo:
+        # Set user specific information (Session State)
+        user_id = gr.State()
+        user_in_narrative_id = gr.State()
+        narrative_id = gr.State()
+        experiment_id = gr.State()
+        system_description_without_context = gr.State()
+        system_description_user_elicitation = gr.State()
+        # Context data
+        raw_context_list = gr.State()
+        stock_context_list = gr.State()
+        first_comp = gr.State()
+        first_context = gr.State()
+        second_comp = gr.State()
+        second_context = gr.State()
+        third_comp = gr.State()
+        third_context = gr.State()
+        fourth_comp = gr.State()
+        fourth_context = gr.State()
+        # Tab data
+        if DEBUG:
+            user_preference_elicitation_session = gr.State(
+                value={
+                    "history": "",
+                    "summary_history": """User Profile collected in the previous conversations: Based on our previous conversation, here's a summary of your investment preferences:
+    #     1. **Preferred Industries:** You're interested in investing in the healthcare sector, without a specific preference for sub-industries such as pharmaceuticals, medical devices, biotechnology, or healthcare services.
+    #     2. **Value vs. Growth Stocks:** You prefer growth stocks, which have the potential for high returns but may be riskier.
+    #     3. **Dividend vs. Non-Dividend Stocks:** You're open to both dividend and non-dividend growth stocks, focusing on reinvesting profits for future growth.
+    #     4. **Cyclical vs. Non-Cyclical Stocks:** You're interested in cyclical stocks, which are sensitive to economic fluctuations and tend to perform well during economic expansions.""",
+                }
+            )
+        else:
+            user_preference_elicitation_session = gr.State(value={"history": "", "summary_history": ""})
+        first_comp_session = gr.State(value={"history": [], "selection": "", "reason": ""})
+        second_comp_session = gr.State(value={"history": [], "selection": "", "reason": ""})
+        third_comp_session = gr.State(value={"history": [], "selection": "", "reason": ""})
+        fourth_comp_session = gr.State(value={"history": [], "selection": "", "reason": ""})
+        # EXperiment Instruction
+        with gr.Tab("Experiment Instruction") as instruction_tab:
+            gr.HTML(value=INSTRUCTION_PAGE, label="Experiment Instruction")
+        # User Preference Elicitation Tab
+        with gr.Tab("Preference Elicitation Stage") as preference_elicitation_tab:
+            user_preference_elicitation_tab = tab_creation_preference_stage()
+            user_narrative = user_preference_elicitation_tab["user_narrative"]
+            click_control_preference_stage(
+                user_preference_elicitation_tab,
+                user_id,
+                user_preference_elicitation_session,
+                system_description_user_elicitation,
+            )
+        with gr.Tab("Financial Decision Stage") as financial_decision:
+            # Experiment Tag
+            first_tab = tab_creation_exploration_stage(0, first_comp, first_context)
+            first_general_instruction, first_round_instruction = (
+                first_tab["general_instruction"],
+                first_tab["round_instruction"],
+            )
+            click_control_exploration_stage(
+                first_tab,
+                user_id,
+                first_comp_session,
+                user_preference_elicitation_session,
+                system_description_without_context,
+            )
+            second_tab = tab_creation_exploration_stage(1, second_comp, second_context)
+            second_general_instruction, second_round_instruction = (
+                second_tab["general_instruction"],
+                second_tab["round_instruction"],
+            )
+            click_control_exploration_stage(
+                second_tab,
+                user_id,
+                second_comp_session,
+                user_preference_elicitation_session,
+                system_description_without_context,
+            )
+            third_tab = tab_creation_exploration_stage(2, third_comp, third_context)
+            third_general_instruction, third_round_instruction = (
+                third_tab["general_instruction"],
+                third_tab["round_instruction"],
+            )
+            click_control_exploration_stage(
+                third_tab,
+                user_id,
+                third_comp_session,
+                user_preference_elicitation_session,
+                system_description_without_context,
+            )
+            fourth_tab = tab_creation_exploration_stage(3, fourth_comp, fourth_context)
+            fourth_general_instruction, fourth_round_instruction = (
+                fourth_tab["general_instruction"],
+                fourth_tab["round_instruction"],
+            )
+            click_control_exploration_stage(
+                fourth_tab,
+                user_id,
+                fourth_comp_session,
+                user_preference_elicitation_session,
+                system_description_without_context,
+            )
+        with gr.Tab("Final Evaluation Stage") as final_evaluation:
+            final_evaluation_tab = tab_final_evaluation()
+            (
+                ranking_first_comp,
+                ranking_second_comp,
+                ranking_third_comp,
+                ranking_fourth_comp,
+                evaluators,
+            ) = (
+                final_evaluation_tab["first"],
+                final_evaluation_tab["second"],
+                final_evaluation_tab["third"],
+                final_evaluation_tab["fourth"],
+                final_evaluation_tab["evaluators"],
+            )
+            click_control_final_evaluation(
+                final_evaluation_tab, user_id, first_comp, second_comp, third_comp, fourth_comp, evaluators
+            )
+        demo.load(
+            set_initial_values,
+            inputs=None,
+            outputs=[
+                user_id,
+                user_in_narrative_id,
+                narrative_id,
+                experiment_id,
+                system_description_without_context,
+                system_description_user_elicitation,
+                raw_context_list,
+                stock_context_list,
+                user_narrative,
+                first_comp,
+                first_context,
+                first_general_instruction,
+                first_round_instruction,
+                second_comp,
+                second_context,
+                second_general_instruction,
+                second_round_instruction,
+                third_comp,
+                third_context,
+                third_general_instruction,
+                third_round_instruction,
+                fourth_comp,
+                fourth_context,
+                fourth_general_instruction,
+                fourth_round_instruction,
+                ranking_first_comp,
+                ranking_second_comp,
+                ranking_third_comp,
+                ranking_fourth_comp,
+            ],
+        )
+    return demo
+# Script entry point: load the experiment data, define the module-level globals that the
+# handlers inside create_demo() read, then build and launch the app.
+if __name__ == "__main__":
+    file_path = os.path.join(ROOT_FILE, "./data/single_stock_data/experiment_processed_data.jsonl")
+    # NOTE(review): `topics` is not referenced anywhere in the visible code.
+    topics = [
+        "healthcare_growth_defensive",
+        "dividend_value_defensive",
+        "nondividend_value_cyclical",
+    ]
+    # Read as a global by get_stock_related_context(), indexed by narrative id.
+    context_info_list = get_context_list(file_path)  # str to List of Dict
+    # The system instruction consists of Task, Personality, and Context.
+    # The bare string below is a no-op expression kept as a note on the Big Five trait pairs.
+    """
+    Personality
+    ["extroverted", "introverted"]
+    ["agreeable", "antagonistic"]
+    ["conscientious", "unconscientious"]
+    ["neurotic", "emotionally stable"]
+    ["open to experience", "closed to experience"]]
+    """
+    # Global variables
+    # `terminator` is read by the respond* handlers and must be defined before any handler runs.
+    terminator = ["<eos>", "<unk>", "<sep>", "<pad>", "<cls>", "<mask>"]
+    demo = create_demo()
+    # NOTE(review): the credentials are only used by the commented-out `auth` argument below.
+    user_list, demo_list = load_username_and_pwd()
+    demo.launch(
+        share=False,
+        # auth=user_list + demo_list + ["test", "test"],
+    )

components/chat_conversation.py ADDED Viewed

	@@ -0,0 +1,173 @@

+from components.induce_personality import construct_big_five_words
+from components.constant import (
+    ACCESS,
+    QUERY_REWRITING,
+    RAG,
+    PERSONALITY,
+    PERSONALITY_LIST,
+    REWRITE_PASSAGES,
+    NUM_PASSAGES,
+    DEVICE,
+    RESPONSE_GENERATOR,
+    TEMPLATE_PAYLOAD,
+)
+from components.prompt import SYSTEM_INSTRUCTION, RAG_INSTRUCTION, PERSONALITY_INSTRUCTION
+import requests
+import together
+def generate_response_debugging(history):
+    # outputs_text = "This is a test response"
+    outputs_text = " ".join([item["content"] for item in history])
+    history = history + [{"role": "assistant", "content": outputs_text}]
+    return outputs_text, history
+# REWRITER = "castorini/t5-base-canard"
def generate_response_together_api(history, max_tokens, client, model="meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo"):
    """Request one non-streaming chat completion and append it to the history.

    Args:
        history: List of ``{"role": ..., "content": ...}`` messages sent as-is.
        max_tokens: Forwarded as the completion's ``max_tokens``.
        client: Object exposing ``chat.completions.create(**kwargs)``.
        model: Model identifier forwarded to the client.

    Returns:
        ``(text, new_history)`` where ``text`` is the content of the first
        choice and ``new_history`` is a new list ending with that reply as an
        assistant message.
    """
    stop_sequences = ["<eos>", "<unk>", "<sep>", "<pad>", "<cls>", "<mask>"]
    completion = client.chat.completions.create(
        model=model,
        messages=history,
        stream=False,
        logprobs=False,
        stop=stop_sequences,
        max_tokens=max_tokens,
    )
    reply = completion.choices[0].message.content
    return reply, history + [{"role": "assistant", "content": reply}]
def make_local_api_call(payload, api_url, timeout=None):
    """POST ``payload`` as JSON to ``api_url`` and return the first generated text.

    Args:
        payload: JSON-serialisable request body.
        api_url: URL of the generation endpoint.
        timeout: Optional timeout in seconds forwarded to ``requests.post``.
            ``None`` (the default) keeps the previous behaviour of not
            bounding the wait.

    Returns:
        The first element of the response's ``"text"`` field, ``""`` when that
        field is missing, empty or null, and ``None`` when the request fails,
        the body is not valid JSON, or the server answers with a non-200
        status. Callers treat any falsy result as a failed generation.
    """
    try:
        response = requests.post(api_url, json=payload, timeout=timeout)
    except requests.exceptions.RequestException as e:
        print(f"Request failed: {e}")
        return None

    if response.status_code != 200:
        # Surface the status code and body so the failure can be diagnosed.
        print(f"Error: {response.status_code}")
        print(response.text)
        return None

    try:
        result = response.json()
    except ValueError as e:
        # JSON decode errors are ValueError subclasses in every requests version.
        print(f"Request failed: {e}")
        return None

    # An empty or null "text" must not raise; fall back to an empty string.
    texts = result.get("text") or [""]
    return texts[0]
def generate_response_local_api(history, terminator, max_tokens, api_url):
    """Generate a reply through the local HTTP endpoint and append it to the history.

    The request body is ``TEMPLATE_PAYLOAD`` overlaid with the prompt
    (``history``), ``max_tokens`` and ``stop_token_ids`` (``terminator``).

    Returns:
        ``(text, new_history)`` on success. When the call yields nothing
        usable, ``("Generation failed", history)`` with the history unchanged.
    """
    request_body = {
        **TEMPLATE_PAYLOAD,
        "prompt": history,
        "max_tokens": max_tokens,
        "stop_token_ids": terminator,
    }
    generated = make_local_api_call(request_body, api_url)
    if not generated:
        print("Failed to generate a response.")
        # Hand back the original history so the failed turn is not recorded.
        return "Generation failed", history
    return generated, history + [{"role": "assistant", "content": generated}]
def conversation_window(history, N=100):
    """Trim the oldest messages so that at most ``N`` remain.

    Messages are removed from the front two at a time, so a history that
    alternates user/assistant turns keeps that alternation. The previous
    version removed exactly one pair regardless of how far the history exceeded
    ``N``, so a history more than two messages over the limit stayed too long.
    For a history that is one or two messages over the limit the result is
    unchanged.

    Args:
        history: List of messages, oldest first.
        N: Maximum number of messages to keep.

    Returns:
        ``history`` itself when it already fits, otherwise a new, shorter list.
    """
    overflow = len(history) - N
    if overflow <= 0:
        return history
    # Round the overflow up to whole pairs so turns are dropped together.
    pairs_to_drop = (overflow + 1) // 2
    return history[2 * pairs_to_drop:]
def format_message_history(message, history):
    """Render past ``(user, assistant)`` pairs plus the new message as one string.

    Every past pair becomes ``"\\n<user>:" + user + "\\n<assistant>:" + assistant``;
    the new ``message`` is appended as ``"\\n<user>: {message}\\n<assistant>"``
    so the text ends with an open assistant cue. A falsy ``history`` yields
    only that final part.
    """
    current_turn = f"\n<user>: {message}\n<assistant>"
    past_turns = "".join(
        "\n<user>:" + turn[0] + "\n<assistant>:" + turn[1]
        for turn in (history or ())
    )
    return past_turns + current_turn
def format_user_message(message, history):
    """Return a new history list with ``message`` appended as a user turn."""
    user_turn = {"role": "user", "content": message}
    return history + [user_turn]
def format_context(message, history):
    """Return a new history list with ``message`` prepended as a system turn."""
    system_turn = {"role": "system", "content": message}
    return [system_turn] + history
def prepare_tokenizer(tokenizer):
    """Make sure the tokenizer knows the special tokens and has an EOS id.

    Each of ``<eos> <unk> <sep> <pad> <cls> <mask>`` is added via
    ``add_tokens`` when ``convert_tokens_to_ids`` returns ``None`` for it.
    If ``eos_token_id`` is ``None`` it is set to the id of ``<eos>``.
    The tokenizer is modified in place.

    Returns:
        ``(tokenizer, terminators)`` where ``terminators`` is a one-element
        list holding the tokenizer's ``eos_token_id``.
    """
    for special in ("<eos>", "<unk>", "<sep>", "<pad>", "<cls>", "<mask>"):
        if tokenizer.convert_tokens_to_ids(special) is not None:
            continue
        tokenizer.add_tokens([special])

    if tokenizer.eos_token_id is None:
        tokenizer.eos_token_id = tokenizer.convert_tokens_to_ids("<eos>")

    return tokenizer, [tokenizer.eos_token_id]
def gradio_to_huggingface_message(gradio_message):
    """Flatten ``(user, bot)`` pairs into a role/content message list.

    Each pair yields a ``user`` message followed by an ``assistant`` message.
    """
    messages = []
    for user_text, bot_text in gradio_message:
        messages.extend(
            (
                {"role": "user", "content": user_text},
                {"role": "assistant", "content": bot_text},
            )
        )
    return messages
def huggingface_to_gradio_message(huggingface_message):
    """Group role/content messages into lists that each end with an assistant reply.

    Messages whose role is neither ``user`` nor ``assistant`` are skipped.
    User contents accumulate until an assistant message arrives; that reply
    closes the group. User messages left without a following assistant reply
    are not included in the result.
    """
    grouped = []
    pending = []
    for utter in huggingface_message:
        role = utter["role"]
        if role not in ("user", "assistant"):
            continue
        pending.append(utter["content"])
        if role == "assistant":
            grouped.append(pending)
            pending = []
    return grouped
def get_personality_instruction(personality):
    """Fill the ``PERSONALITY_INSTRUCTION`` template with ``personality``."""
    template = PERSONALITY_INSTRUCTION
    return template.format(personality)
def get_system_instruction(rag=RAG, personality_list=None):
    """Assemble the system prompt from its optional parts.

    Always starts with ``SYSTEM_INSTRUCTION``. ``RAG_INSTRUCTION`` is appended
    when ``rag`` is truthy, then the personality sentence when
    ``personality_list`` is truthy. The parts are concatenated directly, with
    no separator between them.
    """
    instruction = SYSTEM_INSTRUCTION
    if rag:
        instruction += RAG_INSTRUCTION
    if personality_list:
        trait_words = construct_big_five_words(personality_list)
        instruction += get_personality_instruction(trait_words)
    return instruction
def format_rag_context(rag_context):
    """Render retrieved passages as a single context string.

    ``rag_context`` is a list of dicts with ``passage_id`` and
    ``passage_text`` keys. The result starts with ``"Context: \\n"`` and has
    one ``Passage ID: ..., Text: ...`` entry per passage, each followed by a
    blank line.
    """
    entries = (
        f"Passage ID: {info['passage_id']}, Text: {info['passage_text']}\n\n"
        for info in rag_context
    )
    return "Context: \n" + "".join(entries)

components/constant.py ADDED Viewed

	@@ -0,0 +1,19 @@

# Configuration Constants
import os
# Access token read from the HF_ACCESS_TOKEN environment variable (None when unset).
ACCESS = os.getenv("HF_ACCESS_TOKEN")
# Feature switches; presumably consumed by the app to enable each pipeline stage -- verify against callers.
QUERY_REWRITING = False
RAG = False
PERSONALITY = True
# One trait per Big Five dimension, in the order construct_big_five_words validates them.
PERSONALITY_LIST = ["introverted", "antagonistic", "conscientious", "emotionally stable", "open to experience"]
REWRITE_PASSAGES = False
NUM_PASSAGES = 3
DEVICE = "cuda"
RESPONSE_GENERATOR = "meta-llama/Meta-Llama-3.1-8B-Instruct"
CONV_WINDOW = 100
# NOTE(review): hard-coded private-network address; consider reading it from the environment.
API_URL = "http://10.249.1.2:8888/generate"
# Base request body; generate_response_local_api copies it and adds prompt, max_tokens and stop_token_ids.
TEMPLATE_PAYLOAD = {
    "stream": False,  # Set to True if you want to stream the results
    "logprobs": False,  # Set to True if you want the log probabilities of the tokens
    "include_prompt": False,  # Whether to include the original prompt in the response
}

components/induce_personality.py ADDED Viewed

	@@ -0,0 +1,34 @@

+import itertools
+personality_types = [["extroverted", "introverted"], ["agreeable", "antagonistic"], ["conscientious", "unconscientious"], ["neurotic", "emotionally stable"], ["open to experience", "closed to experience"]]
def construct_big_five_words(persona_type: list):
    """Join five Big Five trait words into an English list.

    e.g., "introverted, antagonistic, conscientious, emotionally stable,
    and open to experience".

    Args:
        persona_type: Sequence whose first five items are, in order, one
            option from each trait pair (extroversion, agreeableness,
            conscientiousness, neuroticism, openness). The input is copied,
            not modified.

    Returns:
        The items joined with ``", "``, with ``"and "`` prefixed to the last.

    Raises:
        ValueError: If fewer than five traits are given or one of the first
            five is not a valid option for its position. Explicit raises are
            used instead of ``assert`` so validation survives ``python -O``.
    """
    trait_pairs = (
        ("extroverted", "introverted"),
        ("agreeable", "antagonistic"),
        ("conscientious", "unconscientious"),
        ("neurotic", "emotionally stable"),
        ("open to experience", "closed to experience"),
    )
    options = list(persona_type)
    if len(options) < len(trait_pairs):
        raise ValueError(
            f"Invalid personality type: expected {len(trait_pairs)} traits, got {len(options)}"
        )
    for position, (trait, allowed) in enumerate(zip(options, trait_pairs)):
        if trait not in allowed:
            raise ValueError(
                f"Invalid personality type: {trait!r} at position {position} is not one of {allowed}"
            )
    options[-1] = "and " + options[-1]
    return ", ".join(options)
def build_personality_prompt(persona_type: list):
    """Return the "You are a character who is ..." sentence for the given traits."""
    trait_words = construct_big_five_words(persona_type)
    return f"You are a character who is {trait_words}."
if __name__ == "__main__":
    # Preview the system prompt for the first five trait combinations.
    for persona_type in itertools.islice(itertools.product(*personality_types), 5):
        system_prompt = "You are a character who is {}.".format(construct_big_five_words(persona_type))
        print(system_prompt)
        print("\n")

components/prompt.py ADDED Viewed

	@@ -0,0 +1,10 @@

# Base system prompt; get_system_instruction always starts from this text.
# NOTE(review): "retrieved passages it if it is relevant" reads as garbled wording; left
# untouched here because the string is sent to the model verbatim.
SYSTEM_INSTRUCTION = """You are an AI financial advisor. Help the client by answering their questions based on conversation history and retrieved passages it if it is relevant and useful for answering the question."""
# Appended directly after SYSTEM_INSTRUCTION (no separator) when retrieval is enabled.
RAG_INSTRUCTION = """The retrieved passages are contained in the context. With the information contained in the context, give a comprehensive answer to the query.  Only use the context if it is relevant and useful for answering the question. Your response should be concise and directly address the question asked. When applicable, mention the source document number."""
# Template with one positional slot for the joined trait words.
PERSONALITY_INSTRUCTION = """You are a character who is {}"""
# Template with two positional slots: retrieved passages, then conversation history.
DEMONSTRATION = """You are an AI financial advisor. Help the client by answering their questions based on retrieved passages from the web and conversation history. Only respond to the user’s latest message and only finish passages starting with <assistant> do not write <user> part.
Retrieved passages:
{}
Here is the conversation history:
{}
"""

components/query_rewriting.py ADDED Viewed

	@@ -0,0 +1,60 @@

+from components.rag_components import get_length_without_special_tokens
+import ipdb
+QUERY_REWRITING = """Given a user query and its context (conversational history), decontextualize the question by addressing coreference and omission issues. The resulting question should retain its original meaning and be as informative as possible, and should not duplicate any previously asked questions in the context. JUST ANSWER THE RESOLVED QUERY WITHOUT ANY OTHER SENTENCES.\nContext: {}\n"""
+REMINDER = """\nRemember you are a query rewriter. JUST ANSWER THE RESOLVED QUERY WITHOUT ANY OTHER SENTENCES."""
def get_context_from_message_history(message_history):
    """Render all non-system messages as ``"role: content"`` lines.

    Returns the lines concatenated (each terminated by a newline), or
    ``"No context available."`` when there is nothing to render.
    """
    rendered = "".join(
        f'{message["role"]}: {message["content"]}\n'
        for message in message_history
        if message["role"] != "system"
    )
    return rendered or "No context available."
def rewrite_query(query: str, history: str, rewriter, rewriter_tokenizer, rewriter_terminator, device="cuda", max_tokens=256, temperature=0.0, top_p=0.9) -> str:
    """Ask the rewriter model for a self-contained version of ``query``.

    The last line of ``history`` is dropped, the remainder is placed in the
    ``QUERY_REWRITING`` system prompt, and ``REMINDER`` is appended to the
    query. Decoding is greedy (``do_sample=False``). ``device`` and
    ``temperature`` are accepted but not used by the body.

    Returns:
        The decoded output with the prompt-length prefix sliced off and
        surrounding whitespace stripped.
    """
    # Drop the final line of the history (the trailing assistant cue).
    history_lines = history.split("\n")
    trimmed_history = "\n".join(history_lines[:-1])

    system_prompt = QUERY_REWRITING.format(trimmed_history)
    reminded_query = query + REMINDER
    user_prompt = [
        {"role": "system", "content": system_prompt},
        {"role": "user", "content": f"user query: {reminded_query}"},
    ]
    prompt = rewriter_tokenizer.apply_chat_template(user_prompt, tokenize=False, add_generation_prompt=True)

    # Debug output, kept in the original order.
    print("user_prompt:", user_prompt)
    print("PROMPT:", prompt)
    print("System Prompt:", system_prompt)
    print("Prompt:", prompt)

    model_inputs = rewriter_tokenizer(prompt, return_tensors="pt").to(rewriter.device)
    generated = rewriter.generate(
        **model_inputs,
        max_new_tokens=max_tokens,
        eos_token_id=rewriter_terminator,
        do_sample=False,  # Greedy decoding to be deterministic
        top_p=top_p,
    )
    # The decoded text repeats the prompt; cut it off by character length.
    prompt_length = get_length_without_special_tokens(prompt, rewriter_tokenizer)
    decoded = rewriter_tokenizer.decode(generated[0], skip_special_tokens=True)
    return decoded[prompt_length:].strip()
+# def rewrite_query(query: str, history: str, rewriter, rewriter_tokenizer, device="cuda") -> str:
+#     context = "|||".join([history, query])
+#     # rewriter = AutoModelForSeq2SeqLM.from_pretrained(model_name).to(device).eval()
+#     # rewriter_tokenizer = AutoTokenizer.from_pretrained(model_name)
+#     tokenized_context = rewriter_tokenizer.encode(context, return_tensors="pt").to(device)
+#     output_ids = rewriter.generate(
+#       tokenized_context,
+#       max_length=200,
+#       num_beams=4,
+#       repetition_penalty=2.5,
+#       length_penalty=1.0,
+#       early_stopping=True
+#     ).to(device)
+#     rewrite = rewriter_tokenizer.decode(output_ids[0], skip_special_tokens=True)
+#     return rewrite

components/rag_components.py ADDED Viewed

	@@ -0,0 +1,190 @@

+import os
+import json
+# Load model and tokenizer from HuggingFace
+import numpy as np
+import pandas as pd
+import torch
+from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
+from sentence_transformers import CrossEncoder
+# from pyserini.search.lucene import LuceneSearcher
+import pyterrier as pt
+from pyterrier_t5 import MonoT5ReRanker, DuoT5ReRanker
+if not pt.started():
+    pt.init()
+import ipdb
def extract_context(json_data, number, turn_id):
    """Collect the conversation up to ``turn_id`` for the topic with ``number``.

    Args:
        json_data: Iterable of topic dicts with ``number`` and ``turns`` keys.
        number: Value matched against each topic's ``number``.
        turn_id: Turn whose utterance is the current one.

    Returns:
        ``(current_utterance, context)``. ``context`` joins, with ``"|||"``,
        the utterance and response of every turn before ``turn_id`` followed
        by the utterance of turn ``turn_id``. When no topic matches, a message
        is printed and ``("No data found for the given number.", None)`` is
        returned.
    """
    topic = next((entry for entry in json_data if entry["number"] == number), None)
    if not topic:
        print("No data found for the given number.")
        return "No data found for the given number.", None

    current_utterance = ""
    pieces = []
    for turn in topic["turns"]:
        this_turn_id = turn["turn_id"]
        if this_turn_id < turn_id:
            pieces.extend((turn["utterance"], turn["response"]))
        elif this_turn_id == turn_id:
            current_utterance = turn["utterance"]
            pieces.append(current_utterance)

    return current_utterance, "|||".join(pieces)
def escape_special_characters(query):
    """Remove query-syntax characters from ``query``.

    Despite the name, the characters ``? & | ! { } [ ] ^ ~ * : " + - ( )``
    are deleted rather than escaped.
    """
    removal_table = str.maketrans("", "", '?&|!{}[]^~*:"+-()')
    return query.translate(removal_table)
def str_to_df_query(query):
    """Build a ``qid``/``query`` DataFrame from a string or a list of strings.

    Every query text is passed through ``escape_special_characters``. A single
    string gets ``qid`` 1; a list gets ``qid`` values starting at 1.

    Raises:
        ValueError: If ``query`` is neither a ``str`` nor a ``list``.
    """
    if isinstance(query, str):
        rows = [[1, escape_special_characters(query)]]
    elif isinstance(query, list):
        rows = [[qid, escape_special_characters(text)] for qid, text in enumerate(query, start=1)]
    else:
        raise ValueError("The query must be a string or a list of strings.")
    return pd.DataFrame(rows, columns=["qid", "query"])
def retrieve_and_rerank(query, pipeline):
    """Run ``query`` through ``pipeline`` and return the hits as a list of dicts.

    Args:
        query: A string or list of strings; converted with ``str_to_df_query``.
        pipeline: Object whose ``transform`` accepts that query frame and
            returns a frame with ``docno``, ``rank``, ``score`` and ``text``
            columns.

    Returns:
        One dict per result row, in the row order of the pipeline output, with
        keys ``passage_id``, ``rank``, ``score`` and ``passage_text``.
    """
    query_df = str_to_df_query(query)
    res = pipeline.transform(query_df)
    candidate_set = []
    for i, row in res.iterrows():
        passage_id = row["docno"]
        # NOTE(review): this value is read but never used; the "rank" emitted below is the
        # frame's index label plus one, not the pipeline's rank column -- confirm intent.
        rank = row["rank"]
        score = row["score"]
        passage_text = row["text"]
        candidate_set.append({"passage_id": passage_id, "rank": i + 1, "score": score, "passage_text": passage_text})
    return candidate_set
def rerank_passages(query, passages, reranker):
    """Score each passage against ``query`` and return them best-first.

    ``reranker.predict`` receives ``[query, passage_text]`` pairs. Each passage
    dict gets a ``reranker_score`` key written in place, and a new list sorted
    by that score in descending order is returned.
    """
    pairs = [[query, candidate["passage_text"]] for candidate in passages]
    for candidate, score in zip(passages, reranker.predict(pairs)):
        candidate["reranker_score"] = score
    return sorted(passages, key=lambda candidate: candidate["reranker_score"], reverse=True)
def rag(rewrite, top_n_passages=3):
    """Retrieve and rerank passages for ``rewrite`` and keep the first few.

    A BM25 retriever (cut to 10) feeds a MonoT5 reranker (cut to 5) over the
    PyTerrier index at a fixed path; the index and pipeline are built on every
    call.

    Returns:
        Up to ``top_n_passages`` dicts with ``passage_id`` and ``passage_text``.
    """
    # Set up
    device = "cuda" if torch.cuda.is_available() else "cpu"
    # Set Up Index
    index_dir = "/root/nfs/iKAT/2023/ikat_index/index_pyterrier_with_text"
    index = pt.IndexFactory.of(os.path.join(index_dir, "data.properties"))
    # Set up Pipeline for retrieval and reranking
    bm25 = pt.BatchRetrieve(index, wmodel="BM25", metadata=["docno", "text"])
    monoT5 = MonoT5ReRanker()
    pipeline = (bm25 % 10) >> pt.text.get_text(index, "text") >> (monoT5 % 5) >> pt.text.get_text(index, "text")
    # Passage retrieval and reranking
    ranked_hits = retrieve_and_rerank(rewrite, pipeline)
    return [
        {"passage_id": hit["passage_id"], "passage_text": hit["passage_text"]}
        for hit in ranked_hits[:top_n_passages]
    ]
def retrieve_passage(resolved_query, history, RAG, top_n_passages=3):
    """Return retrieved passages for ``resolved_query`` when retrieval is enabled.

    Args:
        resolved_query: Query text handed to ``rag``.
        history: Conversation history. Kept for interface compatibility; it no
            longer influences the result.
        RAG: Truthy to run retrieval, falsy to skip it.
        top_n_passages: Number of passages requested from ``rag``. Previously
            this was silently ignored (the ``rag`` default was used) whenever
            ``history`` was empty; it is now honoured on every turn.

    Returns:
        The list produced by ``rag`` when ``RAG`` is truthy, otherwise the
        string ``"No Context"``.
    """
    if not RAG:
        return "No Context"
    return rag(resolved_query, top_n_passages)
def get_length_without_special_tokens(text, tokenizer):
    """Return the character length of ``text`` after a tokenize/decode round trip.

    The text is tokenized, the first sequence of ``input_ids`` is decoded with
    ``skip_special_tokens=True``, and the length of that decoded string is
    returned.
    """
    encoded = tokenizer(text, return_tensors="pt")
    first_sequence_ids = encoded.input_ids[0]
    return len(tokenizer.decode(first_sequence_ids, skip_special_tokens=True))
def response_generation(messages, model, tokenizer, device, terminators, max_tokens=512, temperature=0.0, top_p=0.9):
    """Generate an assistant reply for ``messages`` with greedy decoding.

    The chat template is applied to ``messages``, the model generates up to
    ``max_tokens`` new tokens, and the prompt-length prefix is sliced off the
    decoded text. ``device`` and ``temperature`` are accepted but not used by
    the body.

    Returns:
        ``(reply, new_messages)`` where ``new_messages`` is a new list ending
        with the reply as an assistant message.
    """
    prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
    model_inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
    generated = model.generate(
        **model_inputs,
        max_new_tokens=max_tokens,
        eos_token_id=terminators,
        do_sample=False,  # Greedy decoding to be deterministic
        top_p=top_p,
    )
    # The decoded text repeats the prompt; cut it off by character length.
    prompt_length = get_length_without_special_tokens(prompt, tokenizer)
    full_text = tokenizer.decode(generated[0], skip_special_tokens=True)
    reply = full_text[prompt_length:].strip()
    return reply, messages + [{"role": "assistant", "content": reply}]
# Manual smoke test of the retrieval pipeline: load a demo topic, rewrite the
# query, retrieve and rerank passages, then summarise the top three.
if __name__ == "__main__":
    # Set up
    device = "cuda" if torch.cuda.is_available() else "cpu"
    demo_path = "/nfs/primary/iKAT/2023/"
    with open(os.path.join(demo_path, "ikat_demo/test.json"), "r") as f:
        topics = json.load(f)
    # Set up Index
    # NOTE(review): this path differs from the one used in rag() (no "ikat_index" segment) -- confirm which is correct.
    index_path = os.path.join("/root/nfs/iKAT/2023/index_pyterrier_with_text", "data.properties")
    index = pt.IndexFactory.of(index_path)
    # Set up Pipeline for retrieval and reranking
    bm25 = pt.BatchRetrieve(index, wmodel="BM25", metadata=["docno", "text"])
    monoT5 = MonoT5ReRanker()
    pipeline = (bm25 % 10) >> pt.text.get_text(index, "text") >> (monoT5 % 5) >> pt.text.get_text(index, "text")
    # NOTE(review): `query` is assigned but not used below.
    query = "Can you compare mozzarella with plant-based cheese?"
    # Query rewriting
    rewriter = AutoModelForSeq2SeqLM.from_pretrained("castorini/t5-base-canard").to(device).eval()
    rewriter_tokenizer = AutoTokenizer.from_pretrained("castorini/t5-base-canard")
    number_to_search = "10-1"
    turn_id_to_search = 6
    utterance, context = extract_context(topics, number_to_search, turn_id_to_search)
    # NOTE(review): rewrite_query is neither defined nor imported in this module, so this
    # line raises NameError as written; the argument list also does not match the
    # rewrite_query signature in components/query_rewriting.py.
    rewrite = rewrite_query(context, rewriter, rewriter_tokenizer, device)
    # Passage Retrieval and Reranking
    reranked_passages = retrieve_and_rerank(rewrite, pipeline)
    # Response generation
    summarizer = AutoModelForSeq2SeqLM.from_pretrained("mrm8488/t5-base-finetuned-summarize-news")
    summarizer_tokenizer = AutoTokenizer.from_pretrained("mrm8488/t5-base-finetuned-summarize-news")
    # We use the top-3 reranked passages to generate a response
    passages = [passage["passage_text"] for passage in reranked_passages][:3]
    print(json.dumps(passages, indent=4))
    # NOTE(review): generate_response is not defined in this module either.
    responses = generate_response(passages, summarizer, summarizer_tokenizer)
    print("Done")

components/rewrite_passages.py ADDED Viewed

	@@ -0,0 +1,94 @@

+from components.rag_components import get_length_without_special_tokens
+REWRITE_PASSAGE_PROMPT = """
+A passage has been retrieved from the web based on the query: {}. Please extract only the information that is essential for answering this query with at most two or three sentences. If the passage contains no relevant information, do not extract anything. Provide the extracted information directly without any introductory phrases or additional context.
+Query: {}\n
+Passage: {}\n
+"""
def rewrite_rag_context(resolved_query, rag_context, model, tokenizer, terminator):
    """
    Condense every passage in the RAG context with respect to the resolved query.
    Args:
        resolved_query (str): The resolved user query.
        rag_context (list): Dictionaries with 'passage_id' and 'passage_text'.
        model: The model used for generating rewritten passages.
        tokenizer: The tokenizer used for processing text.
        terminator: Passed through to rewrite_passage as the end-of-sequence id(s).
    Returns:
        list: New dictionaries with the original 'passage_id' and the rewritten 'passage_text'.
    """
    return [
        {
            "passage_id": entry["passage_id"],
            "passage_text": rewrite_passage(resolved_query, entry["passage_text"], model, tokenizer, terminator),
        }
        for entry in rag_context
    ]
def rewrite_passage(resolved_query, passage, model, tokenizer, terminator, max_tokens=256, temperature=0.0, top_p=0.9):
    """
    Rewrites a single passage based on the resolved query.
    Args:
        resolved_query (str): The resolved user query.
        passage (str): The passage text to be rewritten.
        model: The model used for generating rewritten passages.
        tokenizer: The tokenizer used for processing text.
        terminator: End-of-sequence token id(s) passed to ``model.generate``.
        max_tokens (int): The maximum number of tokens to generate. Default is 256.
        temperature (float): Not used; decoding is greedy. Default is 0.0.
        top_p (float): Forwarded to ``model.generate``. Default is 0.9.
    Returns:
        str: The rewritten passage.
    """
    # The template has three slots: the query, the query again, then the passage.
    # The second slot previously received the passage instead of the query.
    user_prompt = REWRITE_PASSAGE_PROMPT.format(resolved_query, resolved_query, passage)
    chatbot = [{"role": "user", "content": user_prompt}]
    prompt = tokenizer.apply_chat_template(chatbot, tokenize=False, add_generation_prompt=True)
    inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
    outputs = model.generate(
        **inputs,
        max_new_tokens=max_tokens,
        eos_token_id=terminator,
        do_sample=False,  # Greedy decoding to be deterministic
        top_p=top_p,
    )
    # The decoded text repeats the prompt; cut it off by character length.
    prompt_length = get_length_without_special_tokens(prompt, tokenizer)
    response = tokenizer.decode(outputs[0], skip_special_tokens=True)[prompt_length:]
    return response.strip()
+# def rewrite_rag_context(resoloved_query, rag_context, model, tokenizer, terminator):
+#     """
+#     rag_context: [{"passage_id": passage["passage_id"], "passage_text": passage['passage_text']} for passage in reranked_passages]
+#     """
+#     retrieved_passages = []
+#     for passage in rag_context:
+#         rewrite = rewrite_passage(resoloved_query, passage["passage_text"], model, tokenizer, terminator)
+#         retrieved_passages.append([{"passage_id": passage["passage_id"], "passage_text":rewrite}])
+#     return retrieved_passages
+# def rewrite_passage(resoloved_query, passage, model, tokenizer, terminator, max_tokens=256, temperature=0.6, top_p=0.9):
+#     chatbot = []
+#     user_prompt = REWRITE_PASSAGE_PROMPT.format(resoloved_query, passage, passage)
+#     chatbot.append({"role": "user", "content": message})
+#     prompt = tokenizer.apply_chat_template(chatbot, tokenize=False, add_generation_prompt=True)
+#     outputs = model.generate(
+#         **inputs,
+#         max_new_tokens=max_tokens,
+#         eos_token_id=terminators,
+#         do_sample=True,
+#         temperature=temperature,
+#         top_p=top_p,
+#     )
+#     prompt_length = get_length_without_special_tokens(prompt, tokenizer)
+#     response = tokenizer.decode(outputs[0], skip_special_tokens=True)[prompt_length:]
+#     return response.strip()

data/single_stock_data/experiment_processed_data.jsonl ADDED Viewed

	@@ -0,0 +1,3 @@

+{"topic": "healthcare_growth_defensive", "data": [{"ticker": "LLY", "sector": "Healthcare", "industry": "Drug Manufacturers - General", "business_summary": "Eli Lilly and Company discovers, develops, and markets human pharmaceuticals worldwide. The company offers Basaglar, Humalog, Humalog Mix 75/25, Humalog U-100, Humalog U-200, Humalog Mix 50/50, insulin lispro, insulin lispro protamine, insulin lispro mix 75/25, Humulin, Humulin 70/30, Humulin N, Humulin R, and Humulin U-500 for diabetes; Jardiance, Mounjaro, and Trulicity for type 2 diabetes; and Zepbound for obesity. It also provides oncology products, including Alimta, Cyramza, Erbitux, Jaypirca, Retevmo, Tyvyt, and Verzenio. In addition, the company offers Olumiant for rheumatoid arthritis, atopic dermatitis, severe alopecia areata, and COVID-19; Taltz for plaque psoriasis, psoriatic arthritis, ankylosing spondylitis, and non-radiographic axial spondylarthritis; Omvoh for ulcerative colitis; Cymbalta for depressive disorder, diabetic peripheral neuropathic pain, generalized anxiety disorder, fibromyalgia, and chronic musculoskeletal pain; Ebglyss for severe atopic dermatitis; and Emgality for migraine prevention and episodic cluster headache. Further, it provides Cialis for erectile dysfunction and benign prostatic hyperplasia; and Forteo for osteoporosis. The company operates Lilly Seaport Innovation Center (LSC), a research and development facility in the Boston Seaport to advancing Lilly's efforts in RNA and DNA-based therapies as well as discovering new drug targets to create life-changing medicines across several disease states, including diabetes, obesity, cardiovascular diseases, neurodegeneration, and chronic pain. It has collaborations with Incyte Corporation; Boehringer Ingelheim Pharmaceuticals, Inc.; F. 
Hoffmann-La Roche Ltd and Genentech, Inc.; Biologics, Inc., AbCellera Biologics Inc.; and Chugai Pharmaceutical Co., Ltd, as well as development collaboration with Eli Lilly and Company for developing QIAstat-Dx IVD panel, for the detection of various APOE genotypes. The company was founded in 1876 and is headquartered in Indianapolis, Indiana.", "beta": 0.416, "short_name": "Eli Lilly and Company", "long_name": "Eli Lilly and Company", "price_data": "2023 Monthly Stock Price: Jan: 339.14, Feb: 307.68, Mar: 339.52, Apr: 391.36, May: 425.68, Jun: 464.85, Jul: 450.55, Aug: 550.50, Sep: 533.55, Oct: 550.23, Nov: 588.18, Dec: 580.10", "earning_summary": "Based on the provided conference call transcript, here's a summary of the key financial metrics discussed:\n\n1.  **Revenue Growth**: Lilly's revenue increased 28% in Q2 2023 compared to Q2 2022. Excluding revenue from Baqsimi and COVID-19 antibodies, revenue grew 22% or 23% on a constant currency basis.\n2.  **Gross Margin**: Gross margin as a percent of revenue was flat in Q2 at 79.8%. Gross margin benefited from product mix, including one-time revenue from the sales of rights to Baqsimi, which was offset by increases in manufacturing expenses related to labor costs and investments in capacity expansion.\n3.  **Operating Expenses**: Total operating expenses increased 14% in Q2. Marketing, selling, and administrative expenses increased 18%, driven by higher marketing and selling expenses associated with recent and upcoming new product launches and additional indications. R&D expenses increased 32%, driven by higher development expenses for late-stage assets and additional investments in early-stage research.\n4.  **Operating Income**: Operating income increased 69% in Q2 driven by higher revenue, including revenue associated with the sales of rights for Baqsimi and lower IPR&D charges, partially offset by higher R&D and SG&A expenses.\n5.  
**EPS**: Earnings per share (EPS) was $2.11 in Q2, a 69% increase versus Q2 of 2022, inclusive of $0.43 of EPS associated with the sales of rights for Baqsimi.\n6.  **Price, Rate, and Volume**: In the U.S., net price increased 2% for the quarter driven by Mounjaro access and savings cards dynamics. Excluding Mounjaro, net price in the U.S. decreased by low single digits, consistent with prior trends.\n7.  **Guidance**: Lilly updated its 2023 financial guidance, increasing revenue guidance by $2.2 billion to a range of $33.4 billion to $33.9 billion. The company also increased its guidance for gross margin as a percent of revenue to approximately 80%, driven by the sales of rights for Baqsimi and its olanzapine portfolio. Operating expense guidance was also increased, with marketing, selling, and administrative costs expected to be in the range of $7.2 billion to $7.4 billion, and research and development expenses expected to be in the range of $8.9", "topic": "healthcare_growth_defensive", "user_narrative": "**Name**: Alex Carter\n**Age**: 27\n**Occupation**: Healthcare Consultant\n**Marital Status**: Single\n**Children**: None\nAlex is a driven healthcare consultant who has been working in the industry for a few years. With a deep interest in healthcare, Alex is passionate about staying informed on medical innovations and the future of biotech companies. Although still in the early stages of their career, Alex is motivated by both personal and professional growth.\nTheir financial goals focus on growing wealth over time, particularly through investing in industries they understand. Alex\u2019s work has made them familiar with the unpredictable nature of the healthcare industry, but Alex maintains a strong belief in its potential for growth.\nAlex is not overly conservative and is willing to take measured risks, favoring rapidly expanding companies over those with more stable, predictable growth. 
Concerned about market downturns, Alex seeks stocks that can withstand economic shifts. Alex is uninterested in dividends, focusing instead on investments with strong potential for capital gains.", "label": 1}, {"ticker": "JNJ", "sector": "Healthcare", "industry": "Drug Manufacturers - General", "business_summary": "Johnson & Johnson, together with its subsidiaries, researches, develops, manufactures, and sells various products in the healthcare field worldwide. The company's Innovative Medicine segment offers products for various therapeutic areas, such as immunology, including rheumatoid arthritis, psoriatic arthritis, inflammatory bowel disease, and psoriasis; infectious diseases comprising HIV/AIDS; neuroscience, consisting of mood disorders, neurodegenerative disorders, and schizophrenia; oncology, such as prostate cancer, hematologic malignancies, lung cancer, and bladder cancer; cardiovascular and metabolism, including thrombosis, diabetes, and macular degeneration; and pulmonary hypertension comprising pulmonary arterial hypertension through retailers, wholesalers, distributors, hospitals, and healthcare professionals for prescription use. Its MedTech segment provides Interventional Solutions, including electrophysiology products to treat heart rhythm disorders; the heart recovery portfolio, which includes technologies to treat severe coronary artery disease requiring high-risk PCI or AMI cardiogenic shock; and neurovascular care that treats hemorrhagic and ischemic stroke. this segment also offers an orthopaedics portfolio that includes products and enabling technologies that support hips, knees, trauma, spine, sports, and other; surgery portfolios comprising advanced and general surgery technologies, as well as solutions for breast aesthetics, ear, nose, and throat procedures; contact lenses under the ACUVUE Brand; and TECNIS intraocular lenses for cataract surgery. 
It distributes its products to wholesalers, hospitals, and retailers, as well as physicians, nurses, hospitals, eye care professionals, and clinics. Johnson & Johnson was founded in 1886 and is based in New Brunswick, New Jersey.", "beta": 0.518, "short_name": "Johnson & Johnson", "long_name": "Johnson & Johnson", "price_data": "2023 Monthly Stock Price: Jan: 156.15, Feb: 147.49, Mar: 149.17, Apr: 157.54, May: 150.35, Jun: 160.50, Jul: 162.44, Aug: 157.91, Sep: 152.12, Oct: 144.88, Nov: 152.26, Dec: 154.31", "earning_summary": "Based on the provided conference call transcript, here's a detailed summary of the key financial metrics discussed:\n\n**Revenue and Sales:**\n\n* Worldwide sales: $21.4 billion, an increase of 6.8% versus the third quarter of 2022.\n* Operational sales growth: 6.4% (excluding the effect of translational currency).\n* U.S. sales: $11.1% increase.\n* Regions outside the U.S.: 1.6% reported growth, 0.7% operational growth.\n* Innovative medicine sales: $13.9 billion, an increase of 5.1% (excluding COVID-19 vaccine sales, worldwide operational sales growth was 8.2%).\n* MedTech sales: $7.5 billion, an increase of 10% (excluding the impact of acquisition and divestitures, worldwide adjusted operational sales growth was 6%).\n\n**Earnings:**\n\n* Net earnings: $4.3 billion.\n* Diluted earnings per share: $1.69.\n* Adjusted net earnings: $6.8 billion, an increase of 14.1% compared to the third quarter of 2022.\n* Adjusted diluted earnings per share: $2.66, an increase of 19.3% compared to the third quarter of 2022.\n\n**Guidance Update:**\n\n* Full-year sales guidance: $84.4 billion to $84.8 billion (constant currency basis), an increase of 8.5% to 9.0% (operational sales growth).\n* Adjusted operational sales growth: 7.2% to 7.7%.\n* Adjusted pre-tax operating margin: expected to improve by approximately 50 basis points versus prior year.\n* Net other income: $1.7 billion to $1.9 billion.\n* Net interest income: $300 million to $400 million.\n* 
Effective tax rate: 15.0% to 15.5%.\n\n**Cash and Capital Allocation:**\n\n* Cash and marketable securities: approximately $24 billion.\n* Debt: approximately $30 billion.\n* Net debt position: $6 billion.\n* Free cash flow: approximately $12 billion (year-to-date through the third quarter).\n\n**Preliminary Perspectives for 2024:**\n\n* Innovative medicine: confident in delivering growth from key brands and newly launched products, with continued progress from the pipeline.\n* MedTech: expect commercial capabilities and continued adoption of recently launched products to drive growth and improve competitiveness", "topic": "healthcare_growth_defensive", "user_narrative": "**Name**: Alex Carter\n**Age**: 27\n**Occupation**: Healthcare Consultant\n**Marital Status**: Single\n**Children**: None\nAlex is a driven healthcare consultant who has been working in the industry for a few years. With a deep interest in healthcare, Alex is passionate about staying informed on medical innovations and the future of biotech companies. Although still in the early stages of their career, Alex is motivated by both personal and professional growth.\nTheir financial goals focus on growing wealth over time, particularly through investing in industries they understand. Alex\u2019s work has made them familiar with the unpredictable nature of the healthcare industry, but Alex maintains a strong belief in its potential for growth.\nAlex is not overly conservative and is willing to take measured risks, favoring rapidly expanding companies over those with more stable, predictable growth. Concerned about market downturns, Alex seeks stocks that can withstand economic shifts. Alex is uninterested in dividends, focusing instead on investments with strong potential for capital gains.", "label": 2}, {"ticker": "PM", "sector": "Consumer Defensive", "industry": "Tobacco", "business_summary": "Philip Morris International Inc. 
operates as a tobacco company working to delivers a smoke-free future and evolving portfolio for the long-term to include products outside of the tobacco and nicotine sector. The company's product portfolio primarily consists of cigarettes and smoke-free products, including heat-not-burn, vapor, and oral nicotine products primarily under the IQOS and ZYN brands; and consumer accessories, such as lighters and matches. It also offers wellness and healthcare products. Philip Morris International Inc. was incorporated in 1987 and is headquartered in Stamford, Connecticut.", "beta": 0.576, "short_name": "Philip Morris International Inc", "long_name": "Philip Morris International Inc.", "price_data": "2023 Monthly Stock Price: Jan: 96.12, Feb: 89.73, Mar: 90.89, Apr: 93.43, May: 84.12, Jun: 92.45, Jul: 94.44, Aug: 90.97, Sep: 88.91, Oct: 85.63, Nov: 89.66, Dec: 91.60", "earning_summary": "Based on the provided transcript, here's a detailed summary of the key financial metrics discussed during the Q3 2023 earnings call of Philip Morris International Inc. (PMI):\n\n**Key Highlights:**\n\n1.  **Revenue Growth:** PMI reported a strong Q3 2023 with net revenues of $9 billion, a 9.3% organic net revenue growth, and a 20.3% adjusted diluted EPS growth.\n2.  **Volume Growth:** Total shipment volume increased by 2.2% in Q3 and 1.5% year-to-date, with HTU shipment volumes growing by 18% in Q3.\n3.  **IQOS Performance:** IQOS HTU shipment volumes grew by 18% in Q3, with a 16.5% organic net revenue growth from smoke-free products.\n4.  **ZYN Performance:** ZYN delivered a remarkable 66% volume growth in Q3, with a 70.8% category volume share and 76% retail value share in the US.\n5.  **Operating Income Growth:** Adjusted operating income grew by 11.3% organically, with a 70 basis points organic margin expansion.\n6.  **Cost Management:** PMI delivered a further $120 million in gross cost efficiencies in Q3, surpassing the $2 billion target for 2021-2023.\n7.  
**Full-Year Outlook:** PMI raised its volume, organic sales growth, and currency-neutral adjusted bottom-line growth forecast, with a 1% to 2% cigarette volume decline and a 390 million to 410 million cans of nicotine pouch forecast.\n8.  **Dividend:** PMI has delivered 16 years of continuous dividend increase since 2008, with a cumulative 183% increase and a CAGR of 77.2%.\n\n**Key Financial Metrics:**\n\n1.  **Net Revenues:** $9 billion (Q3 2023)\n2.  **Organic Net Revenue Growth:** 9.3% (Q3 2023)\n3.  **Adjusted Diluted EPS Growth:** 20.3% (Q3 2023)\n4.  **Total Shipment Volume:** 2.2% growth (Q3 2023)\n5.  **HTU Shipment Volumes:** 18% growth (Q3 2023)\n6.  **IQOS HTU Shipment Volumes:** 18% growth (Q3", "topic": "healthcare_growth_defensive", "user_narrative": "**Name**: Alex Carter\n**Age**: 27\n**Occupation**: Healthcare Consultant\n**Marital Status**: Single\n**Children**: None\nAlex is a driven healthcare consultant who has been working in the industry for a few years. With a deep interest in healthcare, Alex is passionate about staying informed on medical innovations and the future of biotech companies. Although still in the early stages of their career, Alex is motivated by both personal and professional growth.\nTheir financial goals focus on growing wealth over time, particularly through investing in industries they understand. Alex\u2019s work has made them familiar with the unpredictable nature of the healthcare industry, but Alex maintains a strong belief in its potential for growth.\nAlex is not overly conservative and is willing to take measured risks, favoring rapidly expanding companies over those with more stable, predictable growth. Concerned about market downturns, Alex seeks stocks that can withstand economic shifts. 
Alex is uninterested in dividends, focusing instead on investments with strong potential for capital gains.", "label": 3}, {"ticker": "XOM", "sector": "Energy", "industry": "Oil & Gas Integrated", "business_summary": "Exxon Mobil Corporation engages in the exploration and production of crude oil and natural gas in the United States and internationally. It operates through Upstream, Energy Products, Chemical Products, and Specialty Products segments. The Upstream segment explores for and produces crude oil and natural gas. The Energy Products segment offers fuels, aromatics, and catalysts, as well as licensing services. It sells its products under the Exxon, Esso, and Mobil brands. The Chemical Products segment manufactures and markets petrochemicals including olefins, polyolefins, and intermediates. The Specialty Products segment offers performance products, including lubricants, basestocks, waxes, synthetics, elastomers, and resins. The company also involves in the manufacturing, trade, transport, and sale of crude oil, natural gas, petroleum products, petrochemicals, and other specialty products; and pursuit lower-emission business opportunities, including carbon capture and storage, hydrogen, lower-emission fuels, and lithium. Exxon Mobil Corporation was founded in 1870 and is based in Spring, Texas.", "beta": 0.877, "short_name": "Exxon Mobil Corporation", "long_name": "Exxon Mobil Corporation", "price_data": "2023 Monthly Stock Price: Jan: 109.37, Feb: 104.42, Mar: 104.18, Apr: 112.43, May: 97.92, Jun: 102.77, Jul: 102.76, Aug: 107.42, Sep: 113.60, Oct: 102.26, Nov: 100.17, Dec: 97.48", "earning_summary": "**Summary of Key Financial Metrics:**\n\n1.  **Earnings:** Exxon Mobil Corporation reported $9.1 billion in earnings for the third quarter of 2023, a $1.2 billion increase from the previous quarter.\n2.  **Cash Flow from Operations:** The company generated $16 billion in cash flow from operations during the third quarter.\n3.  
**Dividend:** Exxon Mobil announced a 4% increase to the quarterly dividend to $0.95 per share, marking the 41st consecutive year of annual dividend increases.\n4.  **Capital Expenditures (Capex):** The company's capex investments for the year-to-date are $18.6 billion, on track to finish the year at the top end of the guidance range.\n5.  **Production:** Exxon Mobil's year-to-date production of 3.7 million oil-equivalent barrels per day is on track with the full-year guidance.\n6.  **Shareholder Distributions:** The company delivered $8.1 billion in shareholder distributions in the third quarter, consisting of $3.7 billion in dividends and $4.4 billion in share repurchases.\n7.  **Pioneer Natural Resources Acquisition:** Exxon Mobil expects to close the acquisition of Pioneer Natural Resources in early November, with synergies of approximately $1 billion before tax annually, beginning in the second year post-closing, and an average of about $2 billion per year over the next decade.\n8.  **Permian Production:** The combined Permian production is expected to increase to approximately 2 million oil-equivalent barrels per day by the end of 2027.\n9.  **Guyana Production:** Exxon Mobil's production in Guyana is expected to increase, with the company aiming to keep the FPSOs filled and striving to achieve maximum production.\n10. 
**Capex Guidance:** The company's capex guidance for the year is being updated, with the top end of the range being the new target, and the company is expected to provide further guidance in December.\n\n**Key Takeaways:**\n\n*   Exxon Mobil's earnings and cash flow from operations continue to be strong, driven by the company's operational performance and structural earnings improvements.\n*   The company's dividend increase and shareholder distributions demonstrate its commitment to returning value to shareholders.\n*   The acquisition of Pioneer Natural Resources is expected to strengthen Exxon Mobil's position in the Permian Basin and drive synergies and growth.\n*   The company's focus on high-return, advantaged projects and its efforts to", "topic": "healthcare_growth_defensive", "user_narrative": "**Name**: Alex Carter\n**Age**: 27\n**Occupation**: Healthcare Consultant\n**Marital Status**: Single\n**Children**: None\nAlex is a driven healthcare consultant who has been working in the industry for a few years. With a deep interest in healthcare, Alex is passionate about staying informed on medical innovations and the future of biotech companies. Although still in the early stages of their career, Alex is motivated by both personal and professional growth.\nTheir financial goals focus on growing wealth over time, particularly through investing in industries they understand. Alex\u2019s work has made them familiar with the unpredictable nature of the healthcare industry, but Alex maintains a strong belief in its potential for growth.\nAlex is not overly conservative and is willing to take measured risks, favoring rapidly expanding companies over those with more stable, predictable growth. Concerned about market downturns, Alex seeks stocks that can withstand economic shifts. Alex is uninterested in dividends, focusing instead on investments with strong potential for capital gains.", "label": 4}]}
+{"topic": "dividend_value_defensive", "data": [{"ticker": "AMZN", "sector": "Consumer Cyclical", "industry": "Internet Retail", "business_summary": "Amazon.com, Inc. engages in the retail sale of consumer products, advertising, and subscriptions service through online and physical stores in North America and internationally. The company operates through three segments: North America, International, and Amazon Web Services (AWS). It also manufactures and sells electronic devices, including Kindle, Fire tablets, Fire TVs, Echo, Ring, Blink, and eero; and develops and produces media content. In addition, the company offers programs that enable sellers to sell their products in its stores; and programs that allow authors, independent publishers, musicians, filmmakers, Twitch streamers, skill and app developers, and others to publish and sell content. Further, it provides compute, storage, database, analytics, machine learning, and other services, as well as advertising services through programs, such as sponsored ads, display, and video advertising. Additionally, the company offers Amazon Prime, a membership program. The company's products offered through its stores include merchandise and content purchased for resale and products offered by third-party sellers. It serves consumers, sellers, developers, enterprises, content creators, advertisers, and employees. Amazon.com, Inc. 
was incorporated in 1994 and is headquartered in Seattle, Washington.", "beta": 1.147, "short_name": "Amazon.com, Inc.", "long_name": "Amazon.com, Inc.", "price_data": "2023 Monthly Stock Price: Jan: 103.13, Feb: 94.23, Mar: 103.29, Apr: 105.45, May: 120.58, Jun: 130.36, Jul: 133.68, Aug: 138.01, Sep: 127.12, Oct: 133.09, Nov: 146.09, Dec: 151.94", "earning_summary": "Based on the provided conference call transcript, here's a summary of the key financial metrics and insights:\n\n**Revenue and Growth**\n\n* Amazon's Q3 2023 revenue was $143.1 billion, up 11% year-over-year.\n* AWS revenue grew 12% year-over-year, with $919 million of incremental quarter-over-quarter revenue.\n* North America revenue was $87.9 billion, an increase of 11% year-over-year.\n* International revenue was $32.1 billion, an increase of 11% year-over-year, excluding foreign exchange.\n\n**Operating Income and Margin**\n\n* Amazon's Q3 2023 operating income was $11.2 billion, up 343% year-over-year.\n* North America operating income was $4.3 billion, an increase of $4.7 billion year-over-year, resulting in an operating margin of 4.9%, up 100 basis points quarter-over-quarter.\n* AWS operating income was $7 billion, an increase of $1.6 billion year-over-year, with an operating margin of 30.3%.\n\n**Free Cash Flow**\n\n* Trailing 12-month free cash flow adjusted for finance leases was $20.2 billion, an improvement of $41.7 billion year-over-year.\n* The largest driver of the improvement in free cash flow was increased operating income across all three segments.\n\n**Capital Investments**\n\n* Capital investments, defined as a combination of CapEx plus equipment finance leases, were $50 billion for the trailing 12-month period ended September 30, down from $60 billion in the comparable prior year period.\n* For the full year 2023, Amazon expects capital investments to be approximately $50 billion compared to $59 billion in 2022.\n\n**Guidance and Outlook**\n\n* Amazon is ready to make the holiday 
season a great one for customers, with inventory in the best position it's ever been heading into the holiday season.\n* The company continues to believe that putting customers first is the only reliable way to create lasting value for shareholders.\n\n**Key Takeaways**\n\n* Amazon's regional fulfillment network is exceeding expectations, with benefits including shorter transportation distances, faster delivery to customers, and increased purchase frequency by Prime members.\n* The company is seeing strong growth in everyday essentials and consumables, driven by faster delivery speeds.\n* AWS is seeing a stabilization of its year-over-year growth rate, with $919 million of incremental quarter-over-quarter revenue.\n* The company is optimistic about its generative AI business, with growth rates that compare", "topic": "dividend_value_defensive", "user_narrative": "**Name:** Jason Matthews\n**Age:** 30\n**Occupation:** IT Systems Administrator\n**Marital Status:** Married\n**Children:** None\nJason Matthews is a 30-year-old IT systems administrator who works for a mid-sized insurance company. He enjoys the stability of his job and appreciates the predictable nature of his day-to-day responsibilities. Jason is married, and though he and his spouse don\u2019t have children yet, they are planning to start a family in the next few years.\nWhile Jason is young, he\u2019s always been a cautious planner. He has a conservative approach to managing his finances and prefers strategies that offer steady, reliable returns over time. He\u2019s not the type to take big risks in pursuit of higher rewards. His financial goal is to create a portfolio that will generate stable income streams, so he can enjoy peace of mind knowing he\u2019s building for the long term.\nJason is drawn to investments in companies that are well-established, with a history of resilience. 
He tends to prioritize companies that are more likely to sustain their performance over time, regardless of market volatility. Additionally, Jason appreciates investments that offer regular payouts, as he sees this as a way to gradually enhance his financial position without needing to constantly monitor the market. Jason isn’t focused on any particular industry at this time. ", "label": 4}, {"ticker": "JPM", "sector": "Financial Services", "industry": "Banks - Diversified", "business_summary": "JPMorgan Chase & Co. operates as a financial services company worldwide. It operates through four segments: Consumer & Community Banking (CCB), Corporate & Investment Bank (CIB), Commercial Banking (CB), and Asset & Wealth Management (AWM). The CCB segment offers deposit, investment and lending products, cash management, and payments and services; mortgage origination and servicing activities; residential mortgages and home equity loans; and credit cards, auto loans, leases, and travel services to consumers and small businesses through bank branches, ATMs, and digital and telephone banking. The CIB segment provides investment banking products and services, including corporate strategy and structure advisory, and equity and debt market capital-raising services, as well as loan origination and syndication; payments; and cash and derivative instruments, risk management solutions, prime brokerage, and research. This segment also offers securities services, including custody, fund accounting and administration, and securities lending products for asset managers, insurance companies, and public and private investment funds. The CB segment provides financial solutions, including lending, payments, investment banking, and asset management to small and midsized companies, local governments, nonprofit clients, and large corporations, as well as investors, developers, and owners of multifamily, office, retail, industrial, and affordable housing properties. 
The AWM segment offers multi-asset investment management solutions in equities, fixed income, alternatives, and money market funds to institutional clients and retail investors; and retirement products and services, brokerage, custody, estate planning, lending, deposits, and investment management products to high net worth clients. JPMorgan Chase & Co. was founded in 1799 and is headquartered in New York, New York.", "beta": 1.102, "short_name": "JP Morgan Chase & Co.", "long_name": "JPMorgan Chase & Co.", "price_data": "2023 Monthly Stock Price: Jan: 134.54, Feb: 137.80, Mar: 125.26, Apr: 133.93, May: 131.48, Jun: 140.90, Jul: 154.08, Aug: 142.74, Sep: 141.46, Oct: 136.65, Nov: 153.37, Dec: 167.15", "earning_summary": "Based on the provided transcript, here's a detailed summary of the key financial metrics discussed during the Q3 2023 earnings call of JPMorgan Chase & Co.:\n\n**Key Financial Metrics:**\n\n1.  **Net Income:** $13.2 billion\n2.  **Earnings Per Share (EPS):** $4.33\n3.  **Revenue:** $40.7 billion\n4.  **Return on Tangible Common Equity (ROTC):** 22%\n5.  **Net Interest Income (NII):** $88.5 billion (2023 estimate)\n6.  **Net Interest Income ex-Markets:** $89 billion (2023 estimate)\n7.  **Adjusted Expense:** $84 billion (2023 estimate)\n8.  **Credit Costs:** $1.4 billion\n9.  **Net Charge-offs:** $720 million (year-over-year increase)\n10. **Net Reserve Build:** $49 million\n11. **Common Equity Tier 1 (CET1) Ratio:** 14.3% (up 50 basis points from the prior quarter)\n12. **Return on Equity (ROE):** 17% (natural return profile)\n13. **Return on Common Equity (ROCE):** 22% (ROTCE)\n14. **Net Investment Securities Losses:** $669 million\n15. **Firmwide Legal Expense:** $665 million\n\n**Business Segment Performance:**\n\n1.  **Consumer & Community Banking (CCB):** Net income of $5.3 billion, revenue of $17 billion (up 19% year-over-year)\n2.  **Banking & Wealth Management:** Revenue up 30% year-over-year, driven by higher NII on higher rates\n3.  
**Card Services & Auto:** Revenue up 7% year-over-year, driven by higher Card Services NII on higher revolving balances\n4.  **Commercial Banking:** Net income of $1.7 billion, revenue of $3.7 billion (up 20% year-over-year)\n5.  **Investment Banking & Markets:** Revenue of $11.7 billion, down 3% year-over-year\n6.  **Asset & Wealth Management (AWM):** Net income of $1.1 billion, pretax margin of 31%\n7.  **Corporate:** Net income of $911 million, revenue of $1.5 billion (up $1.8 billion year-over-year)", "topic": "dividend_value_defensive", "user_narrative": "**Name:** Jason Matthews\n**Age:** 30\n**Occupation:** IT Systems Administrator\n**Marital Status:** Married\n**Children:** None\nJason Matthews is a 30-year-old IT systems administrator who works for a mid-sized insurance company. He enjoys the stability of his job and appreciates the predictable nature of his day-to-day responsibilities. Jason is married, and though he and his spouse don\u2019t have children yet, they are planning to start a family in the next few years.\nWhile Jason is young, he\u2019s always been a cautious planner. He has a conservative approach to managing his finances and prefers strategies that offer steady, reliable returns over time. He\u2019s not the type to take big risks in pursuit of higher rewards. His financial goal is to create a portfolio that will generate stable income streams, so he can enjoy peace of mind knowing he\u2019s building for the long term.\nJason is drawn to investments in companies that are well-established, with a history of resilience. He tends to prioritize companies that are more likely to sustain their performance over time, regardless of market volatility. Additionally, Jason appreciates investments that offer regular payouts, as he sees this as a way to gradually enhance his financial position without needing to constantly monitor the market. Jason isn’t focused on any particular industry at this time. 
", "label": 3}, {"ticker": "KO", "sector": "Consumer Defensive", "industry": "Beverages - Non-Alcoholic", "business_summary": "The Coca-Cola Company, a beverage company, manufactures, markets, and sells various nonalcoholic beverages worldwide. The company provides sparkling soft drinks, sparkling flavors; water, sports, coffee, and tea; juice, value-added dairy, and plant-based beverages; and other beverages. It also offers beverage concentrates and syrups, as well as fountain syrups to fountain retailers, such as restaurants and convenience stores. The company sells its products under the Coca-Cola, Diet Coke/Coca-Cola Light, Coca-Cola Zero Sugar, caffeine free Diet Coke, Cherry Coke, Fanta Orange, Fanta Zero Orange, Fanta Zero Sugar, Fanta Apple, Sprite, Sprite Zero Sugar, Simply Orange, Simply Apple, Simply Grapefruit, Fresca, Schweppes, Thums Up, Aquarius, Ayataka, BODYARMOR, Ciel, Costa, Dasani, dogadan, FUZE TEA, Georgia, glac\u00e9au smartwater, glac\u00e9au vitaminwater, Gold Peak, Ice Dew, I LOHAS, Powerade, Topo Chico, AdeS, Del Valle, fairlife, innocent, Minute Maid, and Minute Maid Pulpy brands. It operates through a network of independent bottling partners, distributors, wholesalers, and retailers, as well as through bottling and distribution operators. 
The company was founded in 1886 and is headquartered in Atlanta, Georgia.", "beta": 0.608, "short_name": "Coca-Cola Company ", "long_name": "The Coca-Cola Company", "price_data": "2023 Monthly Stock Price: Jan: 58.52, Feb: 56.79, Mar: 59.65, Apr: 61.69, May: 57.37, Jun: 58.35, Jul: 60.01, Aug: 57.97, Sep: 54.67, Oct: 55.17, Nov: 57.53, Dec: 58.01", "earning_summary": "Based on the provided conference call transcript, here's a detailed summary of the key financial metrics discussed:\n\n**Revenue Growth:**\n\n* The company delivered 11% organic revenue growth in Q3 2023.\n* The revenue growth was driven by positive volume growth, pricing actions, and carryover pricing from the previous year.\n* The company expects to deliver 10% to 11% organic revenue growth for the full year 2023.\n\n**Volume Growth:**\n\n* The company delivered 2% unit case growth in Q3 2023.\n* The company expects to deliver positive volume growth for the full year 2023.\n\n**Price/Mix Growth:**\n\n* The company delivered 9% price/mix growth in Q3 2023, driven by pricing actions across operating segments and the impact of hyperinflationary markets.\n* The company expects price/mix growth to moderate in the fourth quarter as they cycle pricing initiatives from the previous year.\n\n**Gross Margin:**\n\n* The company's comparable gross margin expanded by approximately 130 basis points in Q3 2023, driven by underlying expansion and a slight benefit from bottler refranchising, partially offset by the impact of currency headwinds.\n\n**Operating Margin:**\n\n* The company's comparable operating margin expanded by approximately 20 basis points in Q3 2023, driven by strong top-line growth and the impact of refranchising bottling operations, partially offset by an increase in marketing investments and currency headwinds.\n\n**EPS Growth:**\n\n* The company delivered 7% year-over-year comparable EPS growth in Q3 2023, despite higher-than-expected 4% currency headwinds.\n* The company expects to deliver 13% 
to 14% comparable currency-neutral earnings per share growth for the full year 2023.\n\n**Free Cash Flow:**\n\n* The company generated approximately $7.9 billion in free cash flow year-to-date.\n* The company expects to generate approximately $9.5 billion in free cash flow for the full year 2023.\n\n**Balance Sheet:**\n\n* The company's net debt leverage is 1.5x EBITDA, below its target range of 2 to 2.5x.\n* The company has a strong balance sheet and expects to have increased flexibility to continue to reinvest in the business and return capital to shareholders.\n\n**Guidance:**\n\n* The company raised its 2023 guidance to 10% to 11% organic revenue growth and 13% to", "topic": "dividend_value_defensive", "user_narrative": "**Name:** Jason Matthews\n**Age:** 30\n**Occupation:** IT Systems Administrator\n**Marital Status:** Married\n**Children:** None\nJason Matthews is a 30-year-old IT systems administrator who works for a mid-sized insurance company. He enjoys the stability of his job and appreciates the predictable nature of his day-to-day responsibilities. Jason is married, and though he and his spouse don\u2019t have children yet, they are planning to start a family in the next few years.\nWhile Jason is young, he\u2019s always been a cautious planner. He has a conservative approach to managing his finances and prefers strategies that offer steady, reliable returns over time. He\u2019s not the type to take big risks in pursuit of higher rewards. His financial goal is to create a portfolio that will generate stable income streams, so he can enjoy peace of mind knowing he\u2019s building for the long term.\nJason is drawn to investments in companies that are well-established, with a history of resilience. He tends to prioritize companies that are more likely to sustain their performance over time, regardless of market volatility. 
Additionally, Jason appreciates investments that offer regular payouts, as he sees this as a way to gradually enhance his financial position without needing to constantly monitor the market. Jason isn’t focused on any particular industry at this time. ", "label": 1}, {"ticker": "WMT", "sector": "Consumer Defensive", "industry": "Discount Stores", "business_summary": "Walmart Inc. engages in the operation of retail, wholesale, other units, and eCommerce worldwide. The company operates through three segments: Walmart U.S., Walmart International, and Sam's Club. It operates supercenters, supermarkets, hypermarkets, warehouse clubs, cash and carry stores, and discount stores under Walmart and Walmart Neighborhood Market brands; membership-only warehouse clubs; ecommerce websites, such as walmart.com.mx, walmart.ca, flipkart.com, PhonePe and other sites; and mobile commerce applications. The company offers grocery and consumables, including dairy, meat, bakery, deli, produce, dry, chilled or frozen packaged foods, alcoholic and nonalcoholic beverages, floral, snack foods, candy, other grocery items, health and beauty aids, paper goods, laundry and home care, baby care, pet supplies, and other consumable items; fuel, tobacco and other categories. It is also involved in the provision of health and wellness products covering pharmacy, optical and hearing services, and over-the-counter drugs and other medical products; and home and apparel including home improvement, outdoor living, gardening, furniture, apparel, jewelry, tools and power equipment, housewares, toys, seasonal items, mattresses and tire and battery centers. In addition, the company offers consumer electronics and accessories, software, video games, office supplies, appliances, and third-party gift cards. 
Further, it operates digital payment platforms; and offers financial services and related products, including money transfers, bill payments, money orders, check cashing, prepaid access, co-branded credit cards, installment lending, and earned wage access. Additionally, the company markets lines of merchandise under private brands, including Allswell, Athletic Works, Equate, and Free Assembly. The company was formerly known as Wal-Mart Stores, Inc. and changed its name to Walmart Inc. in February 2018. Walmart Inc. was founded in 1945 and is based in Bentonville, Arkansas.", "beta": 0.516, "short_name": "Walmart Inc.", "long_name": "Walmart Inc.", "price_data": "2023 Monthly Stock Price: Jan: 46.78, Feb: 46.21, Mar: 48.14, Apr: 49.29, May: 48.13, Jun: 51.51, Jul: 52.39, Aug: 53.48, Sep: 52.60, Oct: 53.74, Nov: 51.21, Dec: 52.04", "earning_summary": "Here's a detailed summary of the key financial metrics discussed during the Walmart Q3 2024 earnings conference call:\n\n**Revenue and Sales Growth**\n\n* Total revenue grew 4.4% in constant currency, or $7 billion, year-over-year.\n* Walmart U.S. comp sales increased 4.9%, while Sam's Club U.S. comp sales grew 3.8% (excluding fuel).\n* International sales grew 5.4% in constant currency, with Walmex sales up 9% and China sales up 25%.\n* E-commerce sales grew 24% in Walmart U.S., 16% in Sam's Club U.S., and 15% globally.\n\n**Gross Margin**\n\n* Gross margin expanded 32 basis points, driven by the timing shift of Big Billion Days in India and lapping last year's LIFO charge at Sam's Club U.S.\n* Walmart U.S. 
gross margin increased 5 basis points, reflecting lower markdowns and supply chain costs.\n\n**Operating Income and Expenses**\n\n* Adjusted operating income grew 3%, including a 270 basis point currency tailwind.\n* SG&A expenses deleveraged 37 basis points on an adjusted basis, impacted by higher year-over-year wage-related costs and store remodel costs.\n* Legal expenses increased, primarily due to a $70 million to $75 million accrual related to prior periods.\n\n**Return on Investment (ROI)**\n\n* ROI improved 130 basis points to 14.1% over the last 12 months, driven by lapping last year's Q3 charge related to the opioid legal settlement framework and productivity initiatives.\n* The company expects ROI to increase over the coming years.\n\n**Guidance**\n\n* The company raised its full-year sales guidance to 5% to 5.5% from 4% to 4.5% previously.\n* Operating income guidance remains at 7% to 7.5% growth.\n* EPS guidance was raised to $6.40 to $6.48.\n* The company expects merchandise mix pressure to continue in Q4, with grocery and health and wellness sales rates outpacing general merchandise.\n\n**E-commerce and Marketplace Growth**\n\n* E-commerce sales grew 24% in Walmart U.S., 16% in Sam's Club U.S., and 15% globally.\n* Marketplace sales grew 16% in Walmex, 16% in Canada, and 38% in China.\n* The company has more than doubled the number of items available to", "topic": "dividend_value_defensive", "user_narrative": "**Name:** Jason Matthews\n**Age:** 30\n**Occupation:** IT Systems Administrator\n**Marital Status:** Married\n**Children:** None\nJason Matthews is a 30-year-old IT systems administrator who works for a mid-sized insurance company. He enjoys the stability of his job and appreciates the predictable nature of his day-to-day responsibilities. Jason is married, and though he and his spouse don\u2019t have children yet, they are planning to start a family in the next few years.\nWhile Jason is young, he\u2019s always been a cautious planner. 
He has a conservative approach to managing his finances and prefers strategies that offer steady, reliable returns over time. He\u2019s not the type to take big risks in pursuit of higher rewards. His financial goal is to create a portfolio that will generate stable income streams, so he can enjoy peace of mind knowing he\u2019s building for the long term.\nJason is drawn to investments in companies that are well-established, with a history of resilience. He tends to prioritize companies that are more likely to sustain their performance over time, regardless of market volatility. Additionally, Jason appreciates investments that offer regular payouts, as he sees this as a way to gradually enhance his financial position without needing to constantly monitor the market. Jason isn’t focused on any particular industry at this time. ", "label": 2}]}
+{"topic": "nondividend_value_cyclical", "data": [{"ticker": "AAPL", "sector": "Technology", "industry": "Consumer Electronics", "business_summary": "Apple Inc. designs, manufactures, and markets smartphones, personal computers, tablets, wearables, and accessories worldwide. The company offers iPhone, a line of smartphones; Mac, a line of personal computers; iPad, a line of multi-purpose tablets; and wearables, home, and accessories comprising AirPods, Apple TV, Apple Watch, Beats products, and HomePod. It also provides AppleCare support and cloud services; and operates various platforms, including the App Store that allow customers to discover and download applications and digital content, such as books, music, video, games, and podcasts. In addition, the company offers various services, such as Apple Arcade, a game subscription service; Apple Fitness+, a personalized fitness service; Apple Music, which offers users a curated listening experience with on-demand radio stations; Apple News+, a subscription news and magazine service; Apple TV+, which offers exclusive original content; Apple Card, a co-branded credit card; and Apple Pay, a cashless payment service, as well as licenses its intellectual property. The company serves consumers, and small and mid-sized businesses; and the education, enterprise, and government markets. It distributes third-party applications for its products through the App Store. The company also sells its products through its retail and online stores, and direct sales force; and third-party cellular network carriers, wholesalers, retailers, and resellers. Apple Inc. 
was founded in 1976 and is headquartered in Cupertino, California.", "beta": 1.239, "short_name": "Apple Inc.", "long_name": "Apple Inc.", "price_data": "2023 Monthly Stock Price: Jan: 142.95, Feb: 146.26, Mar: 163.61, Apr: 168.36, May: 176.11, Jun: 192.72, Jul: 195.19, Aug: 186.91, Sep: 170.34, Oct: 169.90, Nov: 189.23, Dec: 191.80", "earning_summary": "Based on the provided conference call transcript, here's a detailed summary of the key financial metrics discussed:\n\n1.  **Revenue**: Apple reported revenue of $89.5 billion for the September quarter, a decrease of less than 1% from the same period last year. On a constant-currency basis, revenue grew year-over-year in total and in each geographic segment.\n2.  **iPhone Revenue**: iPhone revenue came in at $43.8 billion, a 3% increase from the same period last year and a new September quarter record. The company set an all-time revenue record in India and September quarter records in several countries, including Brazil, Canada, France, Indonesia, Mexico, the Philippines, Saudi Arabia, Turkey, the UAE, Vietnam, and more.\n3.  **Services Revenue**: Services revenue set an all-time record of $22.3 billion, a 16% year-over-year increase. The company achieved all-time revenue records across App Store, advertising, AppleCare, iCloud, payment services, and video, as well as a September quarter revenue record in Apple Music.\n4.  **Gross Margin**: Company gross margin set a September quarter record at 45.2%, up 70 basis points sequentially, driven by leverage and favorable mix, partially offset by foreign exchange. Products gross margin was 36.6%, up 120 basis points sequentially, also driven by leverage and mix, partially offset by foreign exchange. Services gross margin was 70.9%, up 40 basis points from last quarter due to a different mix.\n5.  **Operating Expenses**: Operating expenses of $13.5 billion were at the low end of the guidance range, up 2% year-over-year.\n6.  
**Net Income**: Net income was $23 billion, and diluted earnings per share was $1.46, up 13% versus last year and a September quarter record.\n7.  **Operating Cash Flow**: Operating cash flow was strong at $21.6 billion.\n8.  **Capital Return Program**: The company returned nearly $25 billion to shareholders, including $3.8 billion in dividends and equivalents and $15.5 billion through open market repurchases of 85 million Apple shares.\n9.  **Guidance**: For the December quarter, the company expects:\n\t* Revenue to be similar to last year, despite having one less week this year.\n\t* iPhone revenue to grow year-over-year on an absolute basis.\n\t* Mac year-over-year performance to significantly accelerate from", "topic": "nondividend_value_cyclical", "user_narrative": "**Name:** Malik Johnson\n**Age:** 25\n**Occupation:** Software Developer\n**Marital Status:** Single\n**Children:** None\nMalik Johnson is a 25-year-old software developer working at a growing tech startup. His background in engineering has given him a methodical approach to problem-solving, which he also applies to his personal finances. Being single with no children allows him the flexibility to focus on building his career and making strategic financial decisions aligned with his long-term goals.\nAt this stage, he isn\u2019t particularly interested in receiving dividends from his investments. Instead, his focus is on identifying undervalued companies with strong long-term potential. Malik stays informed about market trends and enjoys researching sectors that perform well during periods of economic growth. He prefers to invest in businesses well-positioned to take advantage of economic cycles, even if that means accepting some short-term volatility. His goal is to build wealth by capitalizing on companies that will benefit from economic upturns, rather than chasing short-term gains. 
He isn’t focused on any particular industry at this time.", "label": 4}, {"ticker": "PG", "sector": "Consumer Defensive", "industry": "Household & Personal Products", "business_summary": "The Procter & Gamble Company engages in the provision of branded consumer packaged goods worldwide. The company operates through five segments: Beauty; Grooming; Health Care; Fabric & Home Care; and Baby, Feminine & Family Care. The Beauty segment offers conditioners, shampoos, styling aids, and treatments under the Head & Shoulders, Herbal Essences, Pantene, and Rejoice brands; and antiperspirants and deodorants, personal cleansing, and skin care products under the Olay, Old Spice, Safeguard, Secret, SK-II, and Native brands. The Grooming segment provides blades and razors, shave products, appliances, and other grooming products under the Braun, Gillette, and Venus brand names. The Health Care segment offers toothbrushes, toothpastes, and other oral care products under the Crest and Oral-B brand names; and gastrointestinal, pain relief, rapid diagnostics, respiratory, vitamins/minerals/supplements, and other personal health care products under Metamucil, Neurobion, Pepto-Bismol, and Vicks brands. The Fabric & Home Care segment provides fabric enhancers, laundry additives, and laundry detergents under the Ariel, Downy, Gain, and Tide brands; and air care, dish care, P&G professional, and surface care products under the Cascade, Dawn, Fairy, Febreze, Mr. Clean, and Swiffer brands. The Baby, Feminine & Family Care segment offers baby wipes, and taped diapers and pants under the Luvs and Pampers brands; adult incontinence and feminine care products under the Always, Always Discreet, and Tampax brands; and paper towels, tissues, and toilet papers under the Bounty, Charmin, and Puffs brands. 
It sells its products primarily through mass merchandisers, e-commerce, grocery stores, membership club stores, drug stores, department stores, distributors, wholesalers, specialty beauty stores, high-frequency stores, pharmacies, electronics stores, and professional channels, as well as directly to consumers. The company was founded in 1837 and is headquartered in Cincinnati, Ohio.", "beta": 0.407, "short_name": "Procter & Gamble Company ", "long_name": "The Procter & Gamble Company", "price_data": "2023 Monthly Stock Price: Jan: 137.13, Feb: 132.49, Mar: 143.21, Apr: 151.56, May: 138.11, Jun: 147.06, Jul: 152.44, Aug: 150.53, Sep: 142.26, Oct: 147.25, Nov: 150.67, Dec: 143.82", "earning_summary": "**Summary of Key Financial Metrics:**\n\n1.  **Organic Sales Growth:** 7% in Q1 2024, with a guidance range of 4% to 5% for the fiscal year.\n2.  **Pricing Contribution:** 7 points to sales growth in Q1 2024, expected to decrease by 3 to 4 points in Q2 and Q3.\n3.  **Volume Growth:** Modest volume growth outside of China, with a decline of 6% in Greater China.\n4.  **Core Earnings Per Share (EPS):** $1.83 in Q1 2024, up 17% year-over-year, with a guidance range of 6% to 9% growth for the fiscal year.\n5.  **Core Operating Margin:** Increased by 240 basis points in Q1 2024, with a currency-neutral increase of 340 basis points.\n6.  **Adjusted Free Cash Flow Productivity:** 97% in Q1 2024.\n7.  **Cash Return to Share Owners:** $3.8 billion in Q1 2024, with a plan to return $14 billion to $15 billion of cash to shareholders this fiscal year.\n8.  **Commodity Costs:** Expected to be a tailwind of around $800 million after tax in fiscal '24, with a headwind of approximately $1 billion after tax due to foreign exchange rates.\n9.  **Foreign Exchange (FX) Impact:** A headwind of approximately $1 billion after tax, with a 7-point EPS impact from FX.\n10. 
**Guidance Ranges:** Organic sales growth of 4% to 5%, core EPS growth of 6% to 9%, cash productivity of 90%, and cash return to share owners of $14 billion to $15 billion.\n\n**Key Takeaways:**\n\n*   Procter & Gamble's Q1 2024 results were strong, with 7% organic sales growth and 17% core EPS growth.\n*   The company expects a normalization in underlying market growth rate to around 4% for the fiscal year.\n*   Pricing will start to lap in Q2, with a 3 to 4 point decrease in price contribution.\n*   Volume growth is expected to progress sequentially, with a focus on driving wholesale penetration and creating volume growth.\n*   The company is committed to investing in superiority, productivity, and innovation to drive growth and value creation.\n*   Procter &", "topic": "nondividend_value_cyclical", "user_narrative": "**Name:** Malik Johnson\n**Age:** 25\n**Occupation:** Software Developer\n**Marital Status:** Single\n**Children:** None\nMalik Johnson is a 25-year-old software developer working at a growing tech startup. His background in engineering has given him a methodical approach to problem-solving, which he also applies to his personal finances. Being single with no children allows him the flexibility to focus on building his career and making strategic financial decisions aligned with his long-term goals.\nAt this stage, he isn\u2019t particularly interested in receiving dividends from his investments. Instead, his focus is on identifying undervalued companies with strong long-term potential. Malik stays informed about market trends and enjoys researching sectors that perform well during periods of economic growth. He prefers to invest in businesses well-positioned to take advantage of economic cycles, even if that means accepting some short-term volatility. His goal is to build wealth by capitalizing on companies that will benefit from economic upturns, rather than chasing short-term gains. 
He isn’t focused on any particular industry at this time.", "label": 3}, {"ticker": "TSLA", "sector": "Consumer Cyclical", "industry": "Auto Manufacturers", "business_summary": "Tesla, Inc. designs, develops, manufactures, leases, and sells electric vehicles, and energy generation and storage systems in the United States, China, and internationally. The company operates in two segments, Automotive, and Energy Generation and Storage. The Automotive segment offers electric vehicles, as well as sells automotive regulatory credits; and non-warranty after-sales vehicle, used vehicles, body shop and parts, supercharging, retail merchandise, and vehicle insurance services. This segment also provides sedans and sport utility vehicles through direct and used vehicle sales, a network of Tesla Superchargers, and in-app upgrades; purchase financing and leasing services; services for electric vehicles through its company-owned service locations and Tesla mobile service technicians; and vehicle limited warranties and extended service plans. The Energy Generation and Storage segment engages in the design, manufacture, installation, sale, and leasing of solar energy generation and energy storage products, and related services to residential, commercial, and industrial customers and utilities through its website, stores, and galleries, as well as through a network of channel partners; and provision of service and repairs to its energy product customers, including under warranty, as well as various financing options to its solar customers. The company was formerly known as Tesla Motors, Inc. and changed its name to Tesla, Inc. in February 2017. Tesla, Inc. 
was incorporated in 2003 and is headquartered in Austin, Texas.", "beta": 2.297, "short_name": "Tesla, Inc.", "long_name": "Tesla, Inc.", "price_data": "2023 Monthly Stock Price: Jan: 173.22, Feb: 205.71, Mar: 207.46, Apr: 164.31, May: 203.93, Jun: 261.77, Jul: 267.43, Aug: 258.08, Sep: 250.22, Oct: 200.84, Nov: 240.08, Dec: 248.48", "earning_summary": "**Summary Report: Tesla, Inc. Q3 2023 Earnings Conference Call**\n\n**Key Financial Metrics:**\n\n1.  **Vehicle Deliveries:** Tesla expects to deliver 1.8 million vehicles in 2023, with a growth rate of 28% in 2024, assuming 2.3 million deliveries.\n2.  **Cost per Vehicle:** The cost per vehicle decreased to approximately $37,500 in Q3 2023, with a sequential decrease in material cost and freight.\n3.  **Gross Margin:** The company aims to maintain or exceed the trend of cost reduction efforts in 2024, with a focus on engineering, factory operations, and supply chain improvements.\n4.  **Energy Storage:** The energy division is becoming the company's highest-margin business, with 4 gigawatt hours of energy storage products deployed in Q3 2023.\n5.  **Cybertruck:** The company expects to deliver around 250,000 Cybertrucks in 2025, with a significant ramp-up in production, but acknowledges that reaching volume production and cash flow positivity will take time.\n6.  **4680 Cell:** Production in Texas increased 40% quarter-over-quarter, with a focus on quality and scrap reduction.\n7.  **Gigafactory Mexico:** The company is laying the groundwork for construction, but is cautious about the high-interest rate environment and its impact on car affordability.\n8.  **Robotaxi:** The company is making progress with autonomy, with the end-to-end AI system driving around Austin with no interventions.\n9.  **FSD Pricing:** The company plans to make FSD more affordable as it improves, with a temporary low price point, and expects to increase the price as the technology improves.\n10. 
**Gross Margin Evolution:** The company expects to see a sequential benefit from production ramping at Berlin and Austin, but acknowledges that there will be headwinds from the ramp-up of Cybertruck production.\n\n**Key Takeaways:**\n\n1.  Tesla is focused on reducing costs, maximizing delivery volumes, and investing in the future, particularly in AI and next-generation platforms.\n2.  The company is cautious about the high-interest rate environment and its impact on car affordability.\n3.  Tesla is making progress with autonomy, with the end-to-end AI system driving around Austin with no interventions.\n4.  The company plans to make FSD more affordable as it improves, with a temporary low price point.\n5.  Tesla is focused", "topic": "nondividend_value_cyclical", "user_narrative": "**Name:** Malik Johnson\n**Age:** 25\n**Occupation:** Software Developer\n**Marital Status:** Single\n**Children:** None\nMalik Johnson is a 25-year-old software developer working at a growing tech startup. His background in engineering has given him a methodical approach to problem-solving, which he also applies to his personal finances. Being single with no children allows him the flexibility to focus on building his career and making strategic financial decisions aligned with his long-term goals.\nAt this stage, he isn\u2019t particularly interested in receiving dividends from his investments. Instead, his focus is on identifying undervalued companies with strong long-term potential. Malik stays informed about market trends and enjoys researching sectors that perform well during periods of economic growth. He prefers to invest in businesses well-positioned to take advantage of economic cycles, even if that means accepting some short-term volatility. His goal is to build wealth by capitalizing on companies that will benefit from economic upturns, rather than chasing short-term gains. 
He isn’t focused on any particular industry at this time.", "label": 2}, {"ticker": "BAC", "sector": "Financial Services", "industry": "Banks - Diversified", "business_summary": "Bank of America Corporation, through its subsidiaries, provides banking and financial products and services for individual consumers, small and middle-market businesses, institutional investors, large corporations, and governments worldwide. It operates in four segments: Consumer Banking, Global Wealth & Investment Management (GWIM), Global Banking, and Global Markets. The Consumer Banking segment offers traditional and money market savings accounts, certificates of deposit and IRAs, non-interest and interest-bearing checking accounts, and investment accounts and products; credit and debit cards; residential mortgages, and home equity loans; and direct and indirect loans, such as automotive, recreational vehicle, and consumer personal loans. The GWIM segment provides investment management, brokerage, banking, and trust and retirement products and services; wealth management solutions; and customized solutions, including specialty asset management services. The Global Banking segment offers lending products and services, including commercial loans, leases, commitment facilities, trade finance, and commercial real estate and asset-based lending; treasury solutions, such as treasury management, foreign exchange, short-term investing options, and merchant services; working capital management solutions; debt and equity underwriting and distribution, and merger-related and other advisory services; and fixed-income and equity research, and certain market-based services. The Global Markets segment provides market-making, financing, securities clearing, settlement, and custody services; securities and derivative products; and risk management products using interest rate, equity, credit, currency and commodity derivatives, foreign exchange, fixed-income, and mortgage-related products. 
Bank of America Corporation was founded in 1784 and is based in Charlotte, North Carolina.", "beta": 1.338, "short_name": "Bank of America Corporation", "long_name": "Bank of America Corporation", "price_data": "2023 Monthly Stock Price: Jan: 33.96, Feb: 32.83, Mar: 27.55, Apr: 28.21, May: 26.77, Jun: 27.86, Jul: 31.08, Aug: 28.07, Sep: 26.81, Oct: 25.79, Nov: 30.09, Dec: 33.23", "earning_summary": "Based on the provided transcript, here's a summary of the key financial metrics discussed during the Bank of America Corporation's Q3 2023 earnings call:\n\n1.  **Net Income**: $7.8 billion, a 10% increase from the year-ago quarter.\n2.  **Return on Tangible Common Equity (ROTC)**: Over 15%, indicating strong profitability.\n3.  **Net Interest Income (NII)**: $14.5 billion, a 4% increase from the year-ago quarter and above the guided range of $14.2 billion to $14.3 billion.\n4.  **Expense**: $15.8 billion, a decline of $200 million from the previous quarter, and expected to decline further to $15.6 billion in the fourth quarter.\n5.  **Provision Expense**: $1.2 billion, reflecting a macroeconomic outlook with an unemployment rate rising to over 5% in 2024.\n6.  **Credit Quality Metrics**: Consumer delinquencies remain below historical averages, and commercial net charge-offs declined from the previous quarter.\n7.  **Asset Sensitivity**: A 100 basis point parallel shift in the forward yield curve is expected to result in a $3.1 billion NII benefit over the next 12 months.\n8.  **Capital**: The bank has more than $30 billion of excess capital, and the proposed capital rules would require an additional $195 billion of total capital, which the bank believes it can meet.\n9.  **Return on Assets (ROA)**: 1%, indicating a relatively low return on assets.\n10. **Dividend**: A 9% dividend increase, with $2.9 billion returned to shareholders in the quarter.\n11. **Tangible Book Value per Share**: Up 12% year-over-year.\n12. 
**CET1 Ratio**: Improved to 11.9%, well above the current 9.5% requirement.\n13. **Supplemental Leverage Ratio**: 62%, well above the minimum requirement of 5%.\n14. **LCR Ratios**: Remain well above minimums for BAC metrics and stronger at the bank level.\n15. **Loan Growth**: Slowed in the quarter due to a decline in demand for commercial borrowing and lower revolver utilization.\n16. **Deposit Growth**: Average deposits are up 33% from pre-pandemic levels, with consumer deposits up 36% and consumer checking up 45%.\n17. **Ex", "topic": "nondividend_value_cyclical", "user_narrative": "**Name:** Malik Johnson\n**Age:** 25\n**Occupation:** Software Developer\n**Marital Status:** Single\n**Children:** None\nMalik Johnson is a 25-year-old software developer working at a growing tech startup. His background in engineering has given him a methodical approach to problem-solving, which he also applies to his personal finances. Being single with no children allows him the flexibility to focus on building his career and making strategic financial decisions aligned with his long-term goals.\nAt this stage, he isn\u2019t particularly interested in receiving dividends from his investments. Instead, his focus is on identifying undervalued companies with strong long-term potential. Malik stays informed about market trends and enjoys researching sectors that perform well during periods of economic growth. He prefers to invest in businesses well-positioned to take advantage of economic cycles, even if that means accepting some short-term volatility. His goal is to build wealth by capitalizing on companies that will benefit from economic upturns, rather than chasing short-term gains. He isn’t focused on any particular industry at this time.", "label": 1}]}

data/single_stock_data/single_stock_demo.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

dum.txt ADDED Viewed

	@@ -0,0 +1,352 @@

+absl-py==1.3.0
+accelerate==0.31.0
+aiofiles==23.2.1
+aiohappyeyeballs==2.4.3
+aiohttp==3.10.8
+aiosignal==1.2.0
+alembic==1.8.1
+annotated-types==0.6.0
+anyio==3.6.2
+appdirs==1.4.4
+argon2-cffi==21.3.0
+argon2-cffi-bindings==21.2.0
+asttokens==2.0.5
+astunparse==1.6.3
+async-timeout==4.0.2
+attrs==21.4.0
+autopage==0.5.1
+backcall==0.2.0
+beautifulsoup4==4.11.1
+black==22.8.0
+bleach==6.0.0
+blis==0.7.11
+cachetools==5.2.0
+catalogue==2.0.10
+cbor==1.0.0
+certifi==2022.6.15
+cffi==1.15.1
+charset-normalizer==2.1.0
+chest==0.2.3
+click==8.1.7
+cliff==4.1.0
+cloudpathlib==0.18.1
+cloudpickle==2.2.1
+cmaes==0.9.1
+cmake==3.29.0.1
+cmd2==2.4.2
+colorama==0.4.4
+coloredlogs==15.0.1
+colorlog==4.7.2
+comm==0.2.2
+confection==0.1.5
+cryptography==39.0.0
+cwl-eval==1.0.12
+cycler==0.11.0
+cymem==2.0.8
+Cython==3.0.10
+datasets==2.3.2
+debugpy==1.6.2
+decorator==5.1.1
+defusedxml==0.7.1
+Deprecated==1.2.14
+dill==0.3.5.1
+distlib==0.3.6
+distro==1.9.0
+easydict==1.13
+entrypoints==0.4
+et-xmlfile==1.1.0
+eval_type_backport==0.2.0
+executing==0.8.3
+faiss-cpu==1.8.0.post1
+fastapi==0.112.1
+fastjsonschema==2.16.2
+ffmpy==0.4.0
+filelock==3.16.1
+flake8==5.0.4
+flatbuffers==23.3.3
+fonttools==4.34.4
+frozendict==2.3.4
+frozenlist==1.3.0
+fsspec==2024.6.0
+fugashi==1.1.2
+gast==0.4.0
+gdown==5.2.0
+google-auth==2.15.0
+google-auth-oauthlib==1.0.0
+google-pasta==0.2.0
+gradio==4.41.0
+gradio_client==1.3.0
+greenlet==2.0.1
+grpcio==1.51.1
+h11==0.14.0
+h5py==3.8.0
+HeapDict==1.0.1
+html5lib==1.1
+httpcore==1.0.2
+httpx==0.26.0
+huggingface-hub==0.24.2
+humanfriendly==10.0
+idna==3.3
+ijson==3.3.0
+implicit==0.6.2
+importlib-metadata==4.13.0
+importlib-resources==5.10.1
+inscriptis==2.5.0
+ipadic==1.0.0
+ipdb==0.13.13
+ipykernel==6.15.1
+ipython==8.4.0
+ipython-genutils==0.2.0
+ipywidgets==8.1.3
+ir-measures==0.3.3
+ir_datasets==0.5.8
+japanize-matplotlib==1.1.3
+jax==0.4.8
+jedi==0.18.1
+Jinja2==3.1.2
+joblib==1.1.0
+jsonschema==4.17.3
+jupyter==1.0.0
+jupyter-client==7.3.4
+jupyter-console==6.6.3
+jupyter-core==4.11.1
+jupyter-events==0.6.3
+jupyter_server==2.5.0
+jupyter_server_terminals==0.4.4
+jupyterlab-pygments==0.2.2
+jupyterlab_widgets==3.0.11
+kaleido==0.2.1
+keras==2.12.0
+kiwisolver==1.4.4
+krippendorff==0.6.0
+langcodes==3.4.0
+language_data==1.2.0
+libclang==16.0.0
+lightgbm==4.4.0
+lit==18.1.2
+llvmlite==0.39.1
+lxml==5.3.0
+lz4==4.3.3
+Mako==1.2.4
+marisa-trie==1.2.0
+Markdown==3.4.1
+markdown-it-py==3.0.0
+MarkupSafe==2.1.1
+matchpy==0.5.5
+matplotlib==3.5.2
+matplotlib-inline==0.1.3
+mccabe==0.7.0
+mdurl==0.1.2
+mecab==0.996.3
+mistune==2.0.5
+ml-dtypes==0.1.0
+ml-metrics==0.1.4
+more-itertools==10.4.0
+mpmath==1.3.0
+msgpack==1.0.4
+multidict==6.0.2
+multiprocess==0.70.13
+multiset==2.1.1
+multitasking==0.0.11
+murmurhash==1.0.10
+mypy==0.971
+mypy-extensions==0.4.3
+nbclassic==0.5.3
+nbclient==0.7.2
+nbconvert==7.2.10
+nbformat==5.7.3
+nest-asyncio==1.5.5
+networkx==2.8.5
+nltk==3.8.1
+nmslib==2.1.1
+notebook==6.5.3
+notebook_shim==0.2.2
+nptyping==1.4.4
+numba==0.56.4
+numpy==1.24.4
+nvidia-cublas-cu11==11.10.3.66
+nvidia-cublas-cu12==12.1.3.1
+nvidia-cuda-cupti-cu11==11.7.101
+nvidia-cuda-cupti-cu12==12.1.105
+nvidia-cuda-nvrtc-cu11==11.7.99
+nvidia-cuda-nvrtc-cu12==12.1.105
+nvidia-cuda-runtime-cu11==11.7.99
+nvidia-cuda-runtime-cu12==12.1.105
+nvidia-cudnn-cu11==8.5.0.96
+nvidia-cudnn-cu12==8.9.2.26
+nvidia-cufft-cu11==10.9.0.58
+nvidia-cufft-cu12==11.0.2.54
+nvidia-curand-cu11==10.2.10.91
+nvidia-curand-cu12==10.3.2.106
+nvidia-cusolver-cu11==11.4.0.1
+nvidia-cusolver-cu12==11.4.5.107
+nvidia-cusparse-cu11==11.7.4.91
+nvidia-cusparse-cu12==12.1.0.106
+nvidia-nccl-cu11==2.14.3
+nvidia-nccl-cu12==2.18.1
+nvidia-nvjitlink-cu12==12.4.127
+nvidia-nvtx-cu11==11.7.91
+nvidia-nvtx-cu12==12.1.105
+oauthlib==3.2.2
+onnxruntime==1.18.0
+openai==1.12.0
+openpyxl==3.0.10
+opt-einsum==3.3.0
+optuna==3.1.1
+orjson==3.10.7
+packaging==21.3
+pandarallel==1.6.4
+pandas==1.4.3
+pandas-datareader==0.10.0
+pandocfilters==1.5.0
+parso==0.8.3
+pathspec==0.10.1
+patsy==0.5.3
+pbr==5.11.0
+peewee==3.17.6
+pexpect==4.8.0
+pickleshare==0.7.5
+pillow==10.4.0
+pkgutil_resolve_name==1.3.10
+plac==1.3.5
+platformdirs==2.5.2
+plotly==5.13.0
+preshed==3.0.9
+prettytable==3.5.0
+prometheus-client==0.16.0
+prompt-toolkit==3.0.30
+protobuf==3.20.0
+psutil==5.9.1
+ptyprocess==0.7.0
+pure-eval==0.2.2
+pyarrow==17.0.0
+pyasn1==0.4.8
+pyasn1-modules==0.2.8
+pybind11==2.6.1
+pycodestyle==2.9.1
+pycparser==2.21
+pydantic==2.9.2
+pydantic_core==2.23.4
+pydub==0.25.1
+pyflakes==2.5.0
+Pygments==2.18.0
+pyjnius==1.6.1
+pyknp==0.6.1
+pyparsing==3.0.9
+pyperclip==1.8.2
+pyrsistent==0.19.3
+pyserini==0.22.1
+PySocks==1.7.1
+pyterrier-t5 @ git+https://github.com/terrierteam/pyterrier_t5.git@679e3320b0f7c997de108bc44f66ef15fba72f08
+python-dateutil==2.8.2
+python-json-logger==2.0.7
+python-multipart==0.0.9
+python-terrier==0.10.1
+pytrec-eval-terrier==0.5.6
+pytz==2022.7
+PyYAML==6.0
+pyzmq==23.2.0
+qtconsole==5.4.1
+QtPy==2.3.0
+ray==2.2.0
+recbole==1.1.1
+regex==2022.7.9
+requests==2.32.3
+requests-oauthlib==1.3.1
+responses==0.18.0
+rfc3339-validator==0.1.4
+rfc3986-validator==0.1.1
+rich==13.9.1
+rsa==4.9
+ruff==0.6.1
+safetensors==0.4.3
+scikit-learn==1.1.2
+scipy==1.8.1
+seaborn==0.12.1
+semantic-version==2.10.0
+Send2Trash==1.8.0
+sentence-transformers==3.0.1
+sentencepiece==0.1.96
+shap==0.41.0
+shellingham==1.5.4
+six==1.16.0
+slicer==0.0.7
+smart-open==7.0.4
+sniffio==1.3.0
+soupsieve==2.3.2.post1
+spacy==3.7.5
+spacy-legacy==3.0.12
+spacy-loggers==1.0.5
+SQLAlchemy==1.4.45
+srsly==2.4.8
+stack-data==0.3.0
+starlette==0.38.2
+statsmodels==0.13.5
+stevedore==4.1.1
+sympy==1.12
+TA-Lib==0.4.25
+tabulate==0.9.0
+tenacity==8.1.0
+tensorboard==2.12.1
+tensorboard-data-server==0.7.0
+tensorboard-plugin-wit==1.8.1
+tensorboardX==2.5.1
+tensorflow==2.12.0
+tensorflow-estimator==2.12.0
+tensorflow-io-gcs-filesystem==0.32.0
+termcolor==2.2.0
+terminado==0.17.1
+thinc==8.2.5
+thop==0.1.1.post2209072238
+threadpoolctl==3.1.0
+tiktoken==0.6.0
+tinycss2==1.2.1
+together==1.3.0
+tokenizers==0.19.1
+tomli==2.0.1
+tomlkit==0.12.0
+torch==1.13.1
+torch-cluster==1.6.0
+torch-geometric==2.0.4
+torch-scatter==2.0.9
+torch-sparse==0.6.14
+torch-spline-conv==1.2.1
+torch-tb-profiler==0.4.0
+torchaudio==0.13.1
+torchinfo==1.7.1
+torchsummary==1.5.1
+torchvision==0.14.1
+tornado==6.2
+tqdm==4.66.5
+traitlets==5.3.0
+transformers==4.44.1
+trec-car-tools==2.6
+triton==2.1.0
+typer==0.12.3
+typing_extensions==4.9.0
+typish==1.9.3
+unidic==1.1.0
+unidic-lite==1.0.8
+unlzw3==0.2.2
+urllib3==2.2.2
+uvicorn==0.30.6
+virtualenv==20.18.0
+warc3-wet==0.2.5
+warc3-wet-clueweb09==0.2.5
+wasabi==0.9.1
+wcwidth==0.2.5
+weasel==0.4.1
+webencodings==0.5.1
+websocket-client==1.5.1
+websockets==12.0
+Werkzeug==2.2.2
+wget==3.2
+widgetsnbextension==4.0.11
+wrapt==1.14.1
+xlrd==2.0.1
+xlwt==1.3.0
+xxhash==3.0.0
+yarl==1.13.1
+yfinance==0.2.42
+zipp==3.11.0
+zlib-state==0.1.6

experiments/experiment_with_api_without_personalization.py ADDED Viewed

	@@ -0,0 +1,665 @@

+import subprocess
+import sys
+import os
+ROOT_FILE = os.path.join(os.path.dirname(os.path.abspath(__file__)), "../")
+sys.path.append(ROOT_FILE)
+from components.induce_personality import construct_big_five_words
+# need to import: gradio
+def install(package, upgrade=False):
+    if upgrade:
+        subprocess.run(
+            [
+                sys.executable,
+                "-m",
+                "pip",
+                "install",
+                "--upgrade",
+                package,
+            ],
+            check=True,
+        )
+    else:
+        subprocess.run(
+            [
+                sys.executable,
+                "-m",
+                "pip",
+                "install",
+                package,
+            ],
+            check=True,
+        )
+# install("ipdb")
+# install("gradio")
+# install("sentence-transformers")
+# install("git+https://github.com/terrierteam/pyterrier_t5.git")
+# install("protobuf")
+# install("transformers", upgrade=True)
+import random
+import json
+import gradio as gr
+import random
+import time
+import ipdb
+import markdown
+import gradio as gr
+import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer
+from utils import login_to_huggingface, ACCESS
+from components.rewrite_passages import rewrite_rag_context
+from components.query_rewriting import rewrite_query
+from components.chat_conversation import (
+    format_message_history,
+    format_user_message,
+    format_context,
+    gradio_to_huggingface_message,
+    huggingface_to_gradio_message,
+    get_system_instruction,
+    prepare_tokenizer,
+    format_rag_context,
+    conversation_window,
+    generate_response,
+)
+from components.constant import (
+    ACCESS,
+    QUERY_REWRITING,
+    RAG,
+    PERSONALITY,
+    PERSONALITY_LIST,
+    REWRITE_PASSAGES,
+    NUM_PASSAGES,
+    DEVICE,
+    RESPONSE_GENERATOR,
+    CONV_WINDOW,
+    API_URL,
+    TEMPLATE_PAYLOAD,
+)
+from components.induce_personality import (
+    build_personality_prompt,
+)
+# LOG_FILE = "log_file_bingzhi_information_seeking.txt"
+LOG_DIR = os.path.join(ROOT_FILE, "log/seperate_preference_elicitation/others/")
+if os.path.exists(LOG_DIR) is False:
+    os.makedirs(LOG_DIR)
+STATIC_FILE = os.path.join(ROOT_FILE, "_static")
+with open(os.path.join(STATIC_FILE, "html/instruction_page.html"), "r") as f:
+    INSTRUCTION_PAGE = f.read()
+with open(os.path.join(STATIC_FILE, "html/evaluation_instruction.html"), "r") as f:
+    EVALUATION_INSTRUCTION = f.read()
+with open(os.path.join(STATIC_FILE, "html/general_instruction.html"), "r") as f:
+    GENERAL_INSTRUCTION = f.read()
+with open(os.path.join(STATIC_FILE, "html/user_narrative.html"), "r") as f:
+    USER_NARRATIVE = f.read()
+with open(os.path.join(STATIC_FILE, "html/system_instruction_preference_elicitation.html"), "r") as f:
+    PREFERENCE_ELICITATION_TASK = f.read()
+with open(os.path.join(STATIC_FILE, "html/final_evaluation.html"), "r") as f:
+    FINAL_EVALUATION = f.read()
+with open(os.path.join(STATIC_FILE, "txt/system_instruction_with_user_persona.txt"), "r") as f:
+    SYSTEM_INSTRUCTION = f.read()
+with open(os.path.join(STATIC_FILE, "txt/system_instruction_without_personalization.txt"), "r") as f:
+    SYSTEM_INSTRUCTION_WITHOUT_PERSONALIZATION = f.read()
+with open(os.path.join(STATIC_FILE, "txt/system_instruction_preference_elicitation.txt"), "r") as f:
+    SYSTEM_INSTRUECTION_PREFERENCE_ELICITATION = f.read()
+with open(os.path.join(STATIC_FILE, "txt/system_summarization_user_preference_elicitation.txt"), "r") as f:
+    SUMMARIZATION_PROMPT = f.read()
+FIRST_MESSAGE = "Hey"
+INFORMATION_SEEKING = True
+USER_PREFERENCE_SUMMARY = True
+DEBUG = False
+# if DEBUG:
+#     CONV_WINDOW = 3
+def get_context(synthetic_data_path):
+    # Load data from the synthetic data file
+    with open(synthetic_data_path, "r") as f:
+        data = [json.loads(line) for line in f]
+    return data
+def add_ticker_prefix(ticker_list, context_list):
+    res = []
+    for ticker, context in zip(ticker_list, context_list):
+        res.append(f"{ticker}: {context}")
+    return res
+def build_raw_context_list(context_dict):
+    return context_dict["data"]
+def build_context(context_dict):
+    return [build_context_element(context) for context in context_dict["data"]]
+def build_context_element(context):
+    # [{topic: ex, data: {}}, {..}, ..]
+    # Extract information from the context
+    ticker = context["ticker"]
+    sector = context["sector"]
+    business_summary = context["business_summary"]
+    name = context["short_name"]
+    stock_price = context["price_data"]
+    earning = context["earning_summary"]
+    beta = context["beta"]
+    # Build the context string
+    stock_candidate = f"Stock Candidate: {name}"
+    stock_info = f"Stock Information: \nIndustry - {sector}, \nBeta (risk indicator) - {beta}, \nEarning Summary - {earning}\n, 2023 Monthly Stock Price - {stock_price}\n, Business Summary - {business_summary}"
+    context_list = [stock_candidate, stock_info]
+    # Combine all parts into a single string
+    return "\n".join(context_list)
+def get_user_narrative_html(user_narrative):
+    return USER_NARRATIVE.replace("{user_narrative}", user_narrative).replace("\n", "<br>")
+def get_task_instruction_for_user(context):
+    ticker_name = context["short_name"]
+    user_narrative = context["user_narrative"]
+    user_narrative = user_narrative.replace("\n", "<br>")
+    html_user_narrative = markdown.markdown(user_narrative)
+    general_instruction = GENERAL_INSTRUCTION
+    round_instruction = f"""
+<div style="background-color: #f9f9f9; padding: 20px; border-radius: 10px; box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1); margin-bottom: 20px; max-height: 780px; overflow-y: auto; overflow-x: hidden;">
+    <!-- Stock Information (Bold label, Normal ticker name) -->
+    <h2 style="color: #2c3e50; text-align: center; margin-bottom: 20px; font-size: 20px; font-weight: 600;">
+        Round Info
+    </h2>
+    <div style="text-align: left; font-size: 20px; font-weight: bold; margin-bottom: 20px;">
+        Stock
+    </div>
+    <div style="text-align: left; font-weight: normal; font-size: 16px; margin-bottom: 20px;">
+        <span style="font-weight: bold;">
+            This Round's Stock:
+        </span>
+        {ticker_name}
+    </div>
+    <!-- User Narrative (Bold label, Normal narrative) -->
+    <div style="text-align: left; font-size: 20px; font-weight: bold; margin-bottom: 20px;">
+        User Narrative
+    </div>
+    <div style="text-align: left; font-weight: normal; font-size: 16px; margin-bottom: 20px;">
+        {html_user_narrative}
+    </div>
+</div>"""
+    return general_instruction, round_instruction
+def display_system_instruction_with_html(
+    system_instruction,
+):
+    html_system_instruction = f"""
+        <p style="text-align: left; margin-bottom: 10px;">
+            {system_instruction}
+        </p>
+    """
+    return html_system_instruction
+def log_action(tab_name, action, details):
+    """
+    Log actions for each tab (stock).
+    """
+    log_file = os.path.join(LOG_DIR, f"{tab_name}.txt")
+    with open(log_file, "a") as f:
+        f.write(f"Action: {action} | Details: {details}\n")
+def create_demo(
+    terminator,
+    system_description_without_context,
+    stock_context_list,
+    raw_context_list,
+):
+    # Store the history here and use this as an input to each tab.
+    tab_data = {}
+    def tab_creation_exploration_stage(order):
+        """Build the "<n>-1:Discuss" and "<n>-2:Eval" tabs for the stock at position ``order``.
+        Returns a dict holding the company name, the system instruction and every Gradio
+        component that click_control_exploration_stage wires up.
+        """
+        # get_context here is the function nested in create_demo (it takes an index), not the module-level JSONL loader.
+        comp, context, general_instruction, round_instruction = get_context(order)
+        system_instruction = system_description_without_context + "\n" + context
+        tab_data[comp] = {"history": [], "selection": "", "reason": ""}
+        # Tab number labels; order must be between 0 and 4.
+        english_order = ["1", "2", "3", "4", "5"]
+        # with gr.Tab(f"{english_order[order]}: {comp}") as tab:
+        with gr.Tab(f"{english_order[order]}-1:Discuss"):
+            gr.HTML(value=general_instruction, label="General Instruction")
+            with gr.Row():
+                # Left column: round information (stock and user narrative).
+                with gr.Column():
+                    with gr.Row():
+                        gr.HTML(
+                            value=round_instruction,
+                            label="Round Instruction",
+                        )
+                # Right column: the chat with the advisor.
+                with gr.Column():
+                    with gr.Row():
+                        chatbot = gr.Chatbot(height=600)
+                    with gr.Row():
+                        start_conversation = gr.Button(value="Start Conversation")
+                    with gr.Row():
+                        msg = gr.Textbox(scale=1, label="User Input")
+                    with gr.Row():
+                        # Both buttons start disabled; respond_start_conversation returns enabled replacements.
+                        msg_button = gr.Button(value="Send This Message to Advisor", interactive=False)
+                        continue_button = gr.Button(value="Show More of the Advisor’s Answer", interactive=False)
+            with gr.Row():
+                clear = gr.ClearButton([msg, chatbot])
+            if DEBUG:
+                # Debug only: show the full system instruction for this tab.
+                with gr.Row():
+                    display_prompt = gr.HTML(
+                        value=display_system_instruction_with_html(system_instruction),
+                        label="System Instruction",
+                    )
+        with gr.Tab(f"{english_order[order]}-2:Eval"):
+            with gr.Row():
+                gr.HTML(value=EVALUATION_INSTRUCTION)
+            with gr.Row():
+                dropdown = gr.Dropdown(
+                    label="Would you like to purchase the stock?",
+                    choices=["Yes", "No"],
+                    show_label=True,
+                )
+                reason = gr.Textbox(
+                    scale=1,
+                    label="Reason for Your Choice (Explain Your Reasoning & Highlight Useful Parts of Conversation)",
+                    lines=5,
+                )
+            # Four 1-100 rating sliders, each defaulting to 50.
+            with gr.Row():
+                trust = gr.Slider(
+                    label="Trust",
+                    minimum=1,
+                    maximum=100,
+                    value=50,
+                    info="How much do you trust the financial advisor? Answer from 1 to 100. A score of 100 means you have complete trust in the financial advisor, while a score of 1 means you have no trust at all.",
+                    step=1,
+                )
+                satisfaction = gr.Slider(
+                    label="Satisfaction",
+                    minimum=1,
+                    maximum=100,
+                    value=50,
+                    info="How satisfied are you with the financial advisor? Answer from 1 to 100. A score of 100 means you are completely satisfied, while a score of 1 means you are not satisfied at all.",
+                    step=1,
+                )
+            with gr.Row():
+                knowledgeable = gr.Slider(
+                    label="Knowledgeable",
+                    minimum=1,
+                    maximum=100,
+                    value=50,
+                    info="How knowledgeable do you feel after interacting with the financial advisor? Answer from 1 to 100. A score of 100 means you feel very knowledgeable, while a score of 1 means you feel not knowledgeable at all.",
+                    step=1,
+                )
+                helpful = gr.Slider(
+                    label="Helpful",
+                    minimum=1,
+                    maximum=100,
+                    value=50,
+                    info="How helpful do you find the financial advisor? Answer from 1 to 100. A score of 100 means you find the financial advisor very helpful, while a score of 1 means you find the financial advisor not helpful at all.",
+                    step=1,
+                )
+            evaluation_send_button = gr.Button(value="Send: Evaluation")
+        # Hand back everything the event wiring needs, keyed by role.
+        return {
+            "comp": comp,
+            "system_instruction": system_instruction,
+            "start_conversation": start_conversation,
+            "msg_button": msg_button,
+            "continue_button": continue_button,
+            "chatbot": chatbot,
+            "msg": msg,
+            "dropdown": dropdown,
+            "reason": reason,
+            "trust": trust,
+            "satisfaction": satisfaction,
+            "knowledgeable": knowledgeable,
+            "helpful": helpful,
+            "evaluation_send_button": evaluation_send_button,
+        }
+    def tab_final_evaluation(first_comp, second_comp, third_comp, fourth_comp, fifth_comp):
+        with gr.Row():
+            gr.HTML(value=FINAL_EVALUATION)
+        with gr.Row():
+            ranking_first_comp = gr.Dropdown(choices=[1, 2, 3, 4, 5], label=f"{first_comp}")
+            ranking_second_comp = gr.Dropdown(choices=[1, 2, 3, 4, 5], label=f"{second_comp}")
+            ranking_third_comp = gr.Dropdown(choices=[1, 2, 3, 4, 5], label=f"{third_comp}")
+            ranking_fourth_comp = gr.Dropdown(choices=[1, 2, 3, 4, 5], label=f"{fourth_comp}")
+            ranking_fifth_comp = gr.Dropdown(choices=[1, 2, 3, 4, 5], label=f"{fifth_comp}")
+        with gr.Row():
+            textbox = gr.HTML(
+                """<div style="background-color: #f8d7da; color: #721c24; padding: 15px; border: 1px solid #f5c6cb; border-radius: 5px; margin-bottom: 20px;">
+                    <strong>Please rank the stocks from 1 to 5, where 1 is the most preferred and 5 is the least preferred.</strong>
+                    <br>
+                    <strong>Make sure to assign different scores to different stocks.</strong>
+                </div>"""
+            )
+            submit_ranking = gr.Button(value="Submit Ranking")
+        return {
+            "first": {"comp": first_comp, "ranking_first_comp": ranking_first_comp},
+            "second": {"comp": second_comp, "ranking_second_comp": ranking_second_comp},
+            "third": {"comp": third_comp, "ranking_third_comp": ranking_third_comp},
+            "fourth": {"comp": fourth_comp, "ranking_fourth_comp": ranking_fourth_comp},
+            "fifth": {"comp": fifth_comp, "ranking_fifth_comp": ranking_fifth_comp},
+            "submit_ranking": submit_ranking,
+            "text_box": textbox,
+        }
+    def click_control_exploration_stage(tabs):
+        (
+            comp,
+            system_instruction,
+            start_conversation,
+            msg_button,
+            continue_button,
+            chatbot,
+            msg,
+            dropdown,
+            reason,
+            trust,
+            satisfaction,
+            knowledgeable,
+            helpful,
+            evaluation_send_button,
+        ) = (
+            tabs["comp"],
+            tabs["system_instruction"],
+            tabs["start_conversation"],
+            tabs["msg_button"],
+            tabs["continue_button"],
+            tabs["chatbot"],
+            tabs["msg"],
+            tabs["dropdown"],
+            tabs["reason"],
+            tabs["trust"],
+            tabs["satisfaction"],
+            tabs["knowledgeable"],
+            tabs["helpful"],
+            tabs["evaluation_send_button"],
+        )
+        start_conversation.click(
+            lambda history: respond_start_conversation(history, system_instruction, comp),
+            [chatbot],
+            [chatbot, start_conversation, msg_button, continue_button],
+        )
+        msg_button.click(
+            lambda message, history: respond(message, tab_data[comp]["history"], system_instruction, comp),
+            [msg, chatbot],
+            [msg, chatbot],
+        )
+        continue_button.click(
+            lambda history: respond_continue(tab_data[comp]["history"], system_instruction, comp),
+            [chatbot],
+            [chatbot],
+        )
+        evaluation_send_button.click(
+            lambda dropdown, reason, trust, satisfaction, knowledgeable, helpful: respond_evaluation(
+                {
+                    "selection": dropdown,
+                    "reason": reason,
+                    "trust": trust,
+                    "satisfaction": satisfaction,
+                    "knowledgeable": knowledgeable,
+                    "helpful": helpful,
+                },
+                comp,
+            ),
+            [dropdown, reason, trust, satisfaction, knowledgeable, helpful],
+            [dropdown, reason, trust, satisfaction, knowledgeable, helpful],
+        )
+    def click_control_final_evaluation(tabs):
+        first_comp, ranking_first_comp = tabs["first"]["comp"], tabs["first"]["ranking_first_comp"]
+        second_comp, ranking_second_comp = tabs["second"]["comp"], tabs["second"]["ranking_second_comp"]
+        third_comp, ranking_third_comp = tabs["third"]["comp"], tabs["third"]["ranking_third_comp"]
+        fourth_comp, ranking_fourth_comp = tabs["fourth"]["comp"], tabs["fourth"]["ranking_fourth_comp"]
+        fifth_comp, ranking_fifth_comp = tabs["fifth"]["comp"], tabs["fifth"]["ranking_fifth_comp"]
+        result_textbox = tabs["text_box"]
+        submit_ranking = tabs["submit_ranking"]
+        submit_ranking.click(
+            lambda ranking_first_comp, ranking_second_comp, ranking_third_comp, ranking_fourth_comp, ranking_fifth_comp: respond_final_ranking(
+                first_comp,
+                ranking_first_comp,
+                second_comp,
+                ranking_second_comp,
+                third_comp,
+                ranking_third_comp,
+                fourth_comp,
+                ranking_fourth_comp,
+                fifth_comp,
+                ranking_fifth_comp,
+            ),
+            # Input components (names and rankings)
+            [
+                ranking_first_comp,
+                ranking_second_comp,
+                ranking_third_comp,
+                ranking_fourth_comp,
+                ranking_fifth_comp,
+            ],
+            # Output component(s) where you want the result to appear, e.g., result_textbox
+            [result_textbox],
+        )
+    def respond(message, history, system_instruction, tab_name=None):
+        """
+        Return:
+        msg
+        chat_history
+        retrieved_passage
+        rewritten_query
+        """
+        assert (
+            tab_name is not None
+        ), "Tab name is required for the start of the conversation unless it is not preference elicitation."
+        # Formatting Input
+        print(f"User Message: {message} in Tab: {tab_name}")
+        # From string to list [{"role":"user", "content": message}, ...]
+        history = gradio_to_huggingface_message(history)
+        # We can implement context window here as we need all the system interaction. We can cut some of the early interactions if needed.
+        history = conversation_window(history, CONV_WINDOW)
+        print(f"History Length: {len(history)}")
+        print(f"History: {history}")
+        # Add system instruction to the history
+        history = format_context(system_instruction, history)
+        # Add user message to the history
+        history_with_user_utterance = format_user_message(message, history)
+        # Call API instead of locally handle it
+        outputs_text, history = generate_response(history_with_user_utterance, terminator, 128, API_URL)
+        # exclude system interaction and store the others in the history
+        history = huggingface_to_gradio_message(history)
+        if tab_name is not None:
+            print(f"Tab: {tab_name}\nSystem Output: {outputs_text}")
+            # Log the user message and response
+            log_action(tab_name, "User Message", message)
+            log_action(tab_name, "Response", outputs_text)
+            # Store the updated history for this tab
+            tab_data[tab_name]["history"] = history
+        return "", history
+    def respond_start_conversation(history, system_instruction, tab_name=None):
+        assert (
+            tab_name is not None
+        ), "Tab name is required for the start of the conversation unless it is not preference elicitation."
+        print(f"Tab: {tab_name}\nSystem Instruction:{system_instruction}")
+        history = gradio_to_huggingface_message(history)
+        history = format_context(system_instruction, history)
+        first_message = FIRST_MESSAGE
+        history_with_user_utterance = format_user_message(first_message, history)
+        outputs_text, history = generate_response(history_with_user_utterance, terminator, 128, API_URL)
+        # Format
+        history = huggingface_to_gradio_message(history)
+        if tab_name is not None:
+            print(f"Tab: {tab_name}\nHistory: {history}")
+            # Log the user message and response
+            log_action(tab_name, "User Message", first_message)
+            log_action(tab_name, "Response", outputs_text)
+            # Store the updated history for this tab
+            tab_data[tab_name]["history"] = history
+        return (
+            history,
+            gr.Button(value="Start Conversation", interactive=False),
+            gr.Button(value="Send This Message to Advisor", interactive=True),
+            gr.Button(value="Show More of the Advisor’s Answer", interactive=True),
+        )
+    def respond_continue(history, system_instruction, tab_name=None):
+        assert tab_name is not None, "Tab name is required for the start of the conversation."
+        # print(f"Tab: {tab_name}\nSystem Instruction:{system_instruction}")
+        message = "continue"
+        history = gradio_to_huggingface_message(history)
+        history = conversation_window(history, CONV_WINDOW)
+        history = format_context(system_instruction, history)
+        history_with_user_utterance = format_user_message(message, history)
+        outputs_text, history = generate_response(history_with_user_utterance, terminator, 128, API_URL)
+        history = huggingface_to_gradio_message(history)
+        if tab_name is not None:
+            log_action(tab_name, "Show More of the Advisor’s Answer", "User continued the conversation")
+            log_action(tab_name, "Response", outputs_text)
+            # Update history for this tab
+            tab_data[tab_name]["history"] = history
+        return history
+    def respond_evaluation(evals, tab_name):
+        # dropdown, readon_button, multi-evaluator
+        log_action(tab_name, "Round Evaluation", "Following")
+        for key, value in evals.items():
+            log_action(tab_name, key, value)
+        # Store the reason for this tab
+        tab_data[tab_name]["multi_evaluator"] = evals
+        return (
+            evals["selection"],
+            evals["reason"],
+            evals["trust"],
+            evals["satisfaction"],
+            evals["knowledgeable"],
+            evals["helpful"],
+        )
+    def respond_final_ranking(
+        first_comp,
+        ranking_first_comp,
+        second_comp,
+        ranking_second_comp,
+        third_comp,
+        ranking_third_comp,
+        fourth_comp,
+        ranking_fourth_comp,
+        fifth_comp,
+        ranking_fifth_comp,
+    ):
+        # make sure that they are not the same
+        ranking_list = [
+            ranking_first_comp,
+            ranking_second_comp,
+            ranking_third_comp,
+            ranking_fourth_comp,
+            ranking_fifth_comp,
+        ]
+        if len(set(ranking_list)) != len(ranking_list):
+            return """<div style="background-color: #fff3cd; color: #856404; padding: 15px; border: 1px solid #ffeeba; border-radius: 5px; margin-bottom: 20px;">
+                        <strong>Please make sure that you are not ranking the same stock multiple times.</strong>
+                    </div>"""
+        else:
+            log_action("Final_Ranking", first_comp, ranking_first_comp)
+            log_action("Final_Ranking", second_comp, ranking_second_comp)
+            log_action("Final_Ranking", third_comp, ranking_third_comp)
+            log_action("Final_Ranking", fourth_comp, ranking_fourth_comp)
+            log_action("Final_Ranking", fifth_comp, ranking_fifth_comp)
+            return """<div style="background-color: #d4edda; color: #155724; padding: 15px; border: 1px solid #c3e6cb; border-radius: 5px; margin-bottom: 20px;">
+                        <strong>Thank you for participating in the experiment. This concludes the session. You may now close the tab.</strong>
+                    </div>"""
+    def get_context(index):
+        comp = raw_context_list[index]["short_name"]
+        context = stock_context_list[index]
+        general_instruction, round_instruction = get_task_instruction_for_user(raw_context_list[index])
+        return comp, context, general_instruction, round_instruction
+    with gr.Blocks(title="RAG Chatbot Q&A", theme="Soft") as demo:
+        first_comp, first_context, first_general_instruction, first_round_instruction = get_context(0)
+        second_comp, second_context, second_general_instruction, second_round_instruction = get_context(1)
+        third_comp, third_context, third_general_instruction, third_round_instruction = get_context(2)
+        fourth_comp, fourth_context, forth_general_instruction, forth_round_instruction = get_context(3)
+        fifth_comp, fifth_context, fifth_general_instruction, fifth_round_instruction = get_context(4)
+        user_narrative = markdown.markdown(raw_context_list[0]["user_narrative"].replace("\n", "<br>"))
+        # # initialize tab data
+        for comp in [first_comp, second_comp, third_comp, fourth_comp, fifth_comp]:
+            tab_data[comp] = {"history": [], "selection": "", "reason": ""}
+        # EXperiment Instruction
+        with gr.Tab("Experiment Instruction") as instruction_tab:
+            gr.HTML(value=INSTRUCTION_PAGE, label="Experiment Instruction")
+        # Financial decision making stage
+        with gr.Tab("Financial Decision Stage"):
+            # Experiment Tag
+            first_tab = tab_creation_exploration_stage(0)
+            click_control_exploration_stage(first_tab)
+            second_tab = tab_creation_exploration_stage(1)
+            click_control_exploration_stage(second_tab)
+            third_tab = tab_creation_exploration_stage(2)
+            click_control_exploration_stage(third_tab)
+            fourth_tab = tab_creation_exploration_stage(3)
+            click_control_exploration_stage(fourth_tab)
+            fifth_tab = tab_creation_exploration_stage(4)
+            click_control_exploration_stage(fifth_tab)
+        with gr.Tab("Final Evaluation Stage") as final_evaluation:
+            final_evaluation_tab = tab_final_evaluation(first_comp, second_comp, third_comp, fourth_comp, fifth_comp)
+            click_control_final_evaluation(final_evaluation_tab)
+    return demo
+if __name__ == "__main__":
+    login_to_huggingface(ACCESS)
+    file_path = os.path.join(ROOT_FILE, "./data/single_stock_data/single_stock_demo.jsonl")
+    context_info = get_context(file_path)  # str to List of Dict
+    # For Demo Usage, just use the first dict
+    context_info = context_info[0]
+    stock_context_list = build_context(context_info)  # List of str
+    raw_context_list = build_raw_context_list(context_info)  # List of str
+    # system instruction consist of Task, Personality, and Context
+    """
+    Personality
+    ["extroverted", "introverted"]
+    ["agreeable", "antagonistic"]
+    ["conscientious", "unconscientious"]
+    ["neurotic", "emotionally stable"]
+    ["open to experience", "closed to experience"]]
+    """
+    personality = [
+        "extroverted",
+        "agreeable",
+        "conscientious",
+        "emotionally stable",
+        "open to experience",
+    ]
+    personality_prompt = build_personality_prompt(personality)
+    system_instruction_without_context = SYSTEM_INSTRUCTION_WITHOUT_PERSONALIZATION + "\n" + personality_prompt + "\n"
+    tokenizer = AutoTokenizer.from_pretrained(RESPONSE_GENERATOR)
+    tokenizer, terminator = prepare_tokenizer(tokenizer)
+    demo = create_demo(terminator, system_instruction_without_context, stock_context_list, raw_context_list)
+    demo.launch(share=True)

experiments/personality_simulation.py ADDED Viewed

	@@ -0,0 +1,60 @@

+import os
+import ipdb
+import itertools
+import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer
+from tqdm import tqdm
+import json
+from utils import login_to_huggingface, ACCESS
+from components.rag_components import rag, retrieve_passage, response_generation
+from components.rewrite_passages import rewrite_rag_context
+from components.query_rewriting import rewrite_query
+from components.chat_conversation import format_message_history, format_user_message, format_context, gradio_to_huggingface_message, huggingface_to_gradio_message, get_system_instruction, prepare_tokenizer, format_rag_context
+from components.constant import ACCESS, QUERY_REWRITING, RAG, DEVICE, RESPONSE_GENERATOR, NUM_PASSAGES
+from components.prompt import SYSTEM_INSTRUCTION, RAG_INSTRUCTION, PERSONALITY_INSTRUCTION
+from components.induce_personality import construct_big_five_words
+def get_conversation_hitory(persona_type, user_predefined_message, tokenizer, model, terminator):
+    # Output: conversation history {"role": "user", "content": "message"}
+    assert len(user_predefined_message) >= 1, "User message should be at least one"
+    system_instruction = get_system_instruction(rag=RAG, personality_list=persona_type)
+    messages = [{"role": "system", "content": system_instruction}]
+    for user_message in user_predefined_message:
+        if QUERY_REWRITING:
+            str_history = format_message_history(user_message, messages)
+            resolved_query = rewrite_query(user_message, str_history, model, tokenizer, terminator, device=DEVICE)
+        else:
+            resolved_query = user_message
+        messages = format_user_message(resolved_query, messages)
+        # TODO implement rag function as this will be important later
+        _, messages = response_generation(messages, model, tokenizer, device=DEVICE, terminators=terminator)
+    return messages
+def store_conversation_to_text(filename, conversation):
+    with open(filename, "w") as file:
+        for turn in conversation:
+            file.write(f"{turn['role']}: {turn['content']}\n")
+        file.write("\n")  # Add a newline at the end of the conversation
+if __name__ == "__main__":
+    output_par_dir = "./output/personality_output"
+    personality_types = [["extroverted", "introverted"], ["agreeable", "antagonistic"], ["conscientious", "unconscientious"], ["neurotic", "emotionally stable"], ["open to experience", "closed to experience"]]
+    # load case
+    with open("user_predefined_queries.json", "r") as file:
+        user_q = json.load(file)
+    tokenizer = AutoTokenizer.from_pretrained(RESPONSE_GENERATOR)
+    tokenizer, terminator = prepare_tokenizer(tokenizer)
+    model = AutoModelForCausalLM.from_pretrained(RESPONSE_GENERATOR, torch_dtype=torch.float16, pad_token_id=tokenizer.eos_token_id).to(DEVICE)
+    for case_name, user_predefined_message in user_q.items():
+        for persona_type in tqdm(itertools.product(*personality_types)):
+            conv_hist = get_conversation_hitory(persona_type, user_predefined_message, tokenizer, model, terminator)
+            save_file_name = "_".join(persona_type) + ".txt"
+            output_dir = os.path.join(output_par_dir, case_name)
+            if not os.path.exists(output_dir):
+                os.makedirs(output_dir, exist_ok=True)
+            save_file_path = os.path.join(output_dir, save_file_name)
+            store_conversation_to_text(save_file_path, conv_hist)

experiments/separate_preference_elicitation_and_interaction.py ADDED Viewed

	@@ -0,0 +1,851 @@

+import subprocess
+import sys
+import os
+ROOT_FILE = os.path.join(os.path.dirname(os.path.abspath(__file__)), "../")
+sys.path.append(ROOT_FILE)
+from components.induce_personality import construct_big_five_words
+# need to import: gradio
+def install(package, upgrade=False):
+    if upgrade:
+        subprocess.run(
+            [
+                sys.executable,
+                "-m",
+                "pip",
+                "install",
+                "--upgrade",
+                package,
+            ],
+            check=True,
+        )
+    else:
+        subprocess.run(
+            [
+                sys.executable,
+                "-m",
+                "pip",
+                "install",
+                package,
+            ],
+            check=True,
+        )
+# install("ipdb")
+# install("gradio")
+# install("sentence-transformers")
+# install("git+https://github.com/terrierteam/pyterrier_t5.git")
+# install("protobuf")
+# install("transformers", upgrade=True)
+import random
+import json
+import gradio as gr
+import random
+import time
+import ipdb
+import markdown
+import gradio as gr
+import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer
+from utils import login_to_huggingface, ACCESS
+from components.rag_components import (
+    rag,
+    retrieve_passage,
+    response_generation,
+)
+from components.rewrite_passages import rewrite_rag_context
+from components.query_rewriting import rewrite_query
+from components.chat_conversation import (
+    format_message_history,
+    format_user_message,
+    format_context,
+    gradio_to_huggingface_message,
+    huggingface_to_gradio_message,
+    get_system_instruction,
+    prepare_tokenizer,
+    format_rag_context,
+    conversation_window,
+)
+from components.constant import (
+    ACCESS,
+    QUERY_REWRITING,
+    RAG,
+    PERSONALITY,
+    PERSONALITY_LIST,
+    REWRITE_PASSAGES,
+    NUM_PASSAGES,
+    DEVICE,
+    RESPONSE_GENERATOR,
+    CONV_WINDOW,
+)
+from components.induce_personality import (
+    build_personality_prompt,
+)
+# LOG_FILE = "log_file_bingzhi_information_seeking.txt"
+LOG_DIR = os.path.join(ROOT_FILE, "log/seperate_preference_elicitation/others/")
+if os.path.exists(LOG_DIR) is False:
+    os.makedirs(LOG_DIR)
+STATIC_FILE = os.path.join(ROOT_FILE, "_static")
+with open(os.path.join(STATIC_FILE, "html/instruction_page.html"), "r") as f:
+    INSTRUCTION_PAGE = f.read()
+with open(os.path.join(STATIC_FILE, "html/evaluation_instruction.html"), "r") as f:
+    EVALUATION_INSTRUCTION = f.read()
+with open(os.path.join(STATIC_FILE, "html/general_instruction.html"), "r") as f:
+    GENERAL_INSTRUCTION = f.read()
+with open(os.path.join(STATIC_FILE, "html/user_narrative.html"), "r") as f:
+    USER_NARRATIVE = f.read()
+with open(os.path.join(STATIC_FILE, "html/system_instruction_preference_elicitation.html"), "r") as f:
+    PREFERENCE_ELICITATION_TASK = f.read()
+with open(os.path.join(STATIC_FILE, "html/final_evaluation.html"), "r") as f:
+    FINAL_EVALUATION = f.read()
+with open(os.path.join(STATIC_FILE, "txt/system_instruction_with_user_persona.txt"), "r") as f:
+    SYSTEM_INSTRUCTION = f.read()
+with open(os.path.join(STATIC_FILE, "txt/system_instruction_preference_elicitation.txt"), "r") as f:
+    SYSTEM_INSTRUECTION_PREFERENCE_ELICITATION = f.read()
+with open(os.path.join(STATIC_FILE, "txt/system_summarization_user_preference_elicitation.txt"), "r") as f:
+    SUMMARIZATION_PROMPT = f.read()
+FIRST_MESSAGE = "Hey"
+INFORMATION_SEEKING = True
+USER_PREFERENCE_SUMMARY = True
+DEBUG = True
+# if DEBUG:
+#     CONV_WINDOW = 3
+def get_context(synthetic_data_path):
+    # Load data from the synthetic data file
+    with open(synthetic_data_path, "r") as f:
+        data = [json.loads(line) for line in f]
+    return data
+def add_ticker_prefix(ticker_list, context_list):
+    res = []
+    for ticker, context in zip(ticker_list, context_list):
+        res.append(f"{ticker}: {context}")
+    return res
+def build_raw_context_list(context_dict):
+    return context_dict["data"]
+def build_context(context_dict):
+    return [build_context_element(context) for context in context_dict["data"]]
+def build_context_element(context):
+    # [{topic: ex, data: {}}, {..}, ..]
+    # Extract information from the context
+    ticker = context["ticker"]
+    sector = context["sector"]
+    business_summary = context["business_summary"]
+    name = context["short_name"]
+    stock_price = context["price_data"]
+    earning = context["earning_summary"]
+    beta = context["beta"]
+    # Build the context string
+    stock_candidate = f"Stock Candidate: {name}"
+    stock_info = f"Stock Information: \nIndustry - {sector}, \nBeta (risk indicator) - {beta}, \nEarning Summary - {earning}\n, 2023 Monthly Stock Price - {stock_price}\n, Business Summary - {business_summary}"
+    context_list = [stock_candidate, stock_info]
+    # Combine all parts into a single string
+    return "\n".join(context_list)
+def get_user_narrative_html(user_narrative):
+    return USER_NARRATIVE.replace("{user_narrative}", user_narrative).replace("\n", "<br>")
+def get_task_instruction_for_user(context):
+    ticker_name = context["short_name"]
+    user_narrative = context["user_narrative"]
+    user_narrative = user_narrative.replace("\n", "<br>")
+    html_user_narrative = markdown.markdown(user_narrative)
+    general_instruction = GENERAL_INSTRUCTION
+    round_instruction = f"""
+<div style="background-color: #f9f9f9; padding: 20px; border-radius: 10px; box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1); margin-bottom: 20px; max-height: 780px; overflow-y: auto; overflow-x: hidden;">
+    <!-- Stock Information (Bold label, Normal ticker name) -->
+    <h2 style="color: #2c3e50; text-align: center; margin-bottom: 20px; font-size: 20px; font-weight: 600;">
+        Round Info
+    </h2>
+    <div style="text-align: left; font-size: 20px; font-weight: bold; margin-bottom: 20px;">
+        Stock
+    </div>
+    <div style="text-align: left; font-weight: normal; font-size: 16px; margin-bottom: 20px;">
+        <span style="font-weight: bold;">
+            This Round's Stock:
+        </span>
+        {ticker_name}
+    </div>
+    <!-- User Narrative (Bold label, Normal narrative) -->
+    <div style="text-align: left; font-size: 20px; font-weight: bold; margin-bottom: 20px;">
+        User Narrative
+    </div>
+    <div style="text-align: left; font-weight: normal; font-size: 16px; margin-bottom: 20px;">
+        {html_user_narrative}
+    </div>
+</div>"""
+    return general_instruction, round_instruction
+def display_system_instruction_with_html(
+    system_instruction,
+):
+    html_system_instruction = f"""
+        <p style="text-align: left; margin-bottom: 10px;">
+            {system_instruction}
+        </p>
+    """
+    return html_system_instruction
+def log_action(tab_name, action, details):
+    """
+    Log actions for each tab (stock).
+    """
+    log_file = os.path.join(LOG_DIR, f"{tab_name}.txt")
+    with open(log_file, "a") as f:
+        f.write(f"Action: {action} | Details: {details}\n")
+def add_user_profile_to_system_instruction(
+    system_instruction, user_preference_elicitation_data, summary, model, terminator
+):
+    if summary:
+        if user_preference_elicitation_data["summary_history"] == "":
+            # Format prompt
+            summarization_prompt = SUMMARIZATION_PROMPT + "\nPrevious Conversations: {}".format(
+                user_preference_elicitation_data["history"]
+            )
+            summarization_instruction = [{"role": "system", "content": summarization_prompt}]
+            summ, _ = response_generation(
+                summarization_instruction,
+                model,
+                tokenizer,
+                max_tokens=512,
+                device=DEVICE,
+                terminators=terminator,
+            )
+            user_preference_elicitation_data["summary_history"] = summ
+            log_action("Prompt", "Preference Elicitation Summarization", summ)
+            print(f"Preference Summary:{summ}")
+        system_instruction += f"\nPrevious Conversations with the Customer about the User Profile: {user_preference_elicitation_data['summary_history']}\n"
+    else:
+        system_instruction += f"\nPrevious Conversations with the Customer about the User Profile: {user_preference_elicitation_data['history']}\n"
+    return system_instruction
+def create_demo(
+    model,
+    tokenizer,
+    terminator,
+    system_description_without_context,
+    stock_context_list,
+    raw_context_list,
+):
+    """Assemble the Gradio app for the experiment and return it.
+
+    The app has an instruction tab, a preference-elicitation tab, a
+    decision stage with a Discuss and an Eval tab per stock, and a final
+    ranking tab. Entries 0-4 of the two context lists are used.
+
+    Args:
+        model: Model handed to ``response_generation``.
+        tokenizer: Tokenizer handed to ``response_generation``.
+        terminator: Terminators handed to ``response_generation``.
+        system_description_without_context: System prompt text that each
+            stock's context string is appended to.
+        stock_context_list: Formatted context string per stock.
+        raw_context_list: Raw entry per stock; ``short_name`` and
+            ``user_narrative`` are read from it.
+
+    Returns:
+        The ``gr.Blocks`` application.
+    """
+    # Store the history here and use this as an input to each tab.
+    # Keyed by company short name; shared by all nested handlers below.
+    tab_data = {}
+    user_preference_elicitation_data = {"history": "", "summary_history": ""}
+    # In DEBUG mode a canned summary is pre-filled, so the "summary_history is empty"
+    # check in add_user_profile_to_system_instruction never triggers summarization.
+    if DEBUG:
+        user_preference_elicitation_data[
+            "summary_history"
+        ] = """Previous Conversations with the Customer about the User Profile: Based on our previous conversation, here's a summary of your investment preferences:
+        1. **Preferred Industries:** You're interested in investing in the healthcare sector, without a specific preference for sub-industries such as pharmaceuticals, medical devices, biotechnology, or healthcare services.
+        2. **Value vs. Growth Stocks:** You prefer growth stocks, which have the potential for high returns but may be riskier.
+        3. **Dividend vs. Non-Dividend Stocks:** You're open to both dividend and non-dividend growth stocks, focusing on reinvesting profits for future growth.
+        4. **Cyclical vs. Non-Cyclical Stocks:** You're interested in cyclical stocks, which are sensitive to economic fluctuations and tend to perform well during economic expansions."""
+    def tab_creation_exploration_stage(order):
+        """Create the "Discuss" and "Eval" tabs for the stock at index ``order``.
+
+        Must be called inside an open Gradio layout context, because the
+        components are created as a side effect. Also resets this stock's
+        entry in ``tab_data``.
+
+        Returns:
+            Dict with the company name, its full system instruction and the
+            components that ``click_control_exploration_stage`` wires up.
+        """
+        # Resolves to the nested get_context(index) defined further down in create_demo.
+        comp, context, general_instruction, round_instruction = get_context(order)
+        system_instruction = system_description_without_context + "\n" + context
+        tab_data[comp] = {"history": [], "selection": "", "reason": ""}
+        # Tab-title prefixes; ``order`` indexes into this list.
+        english_order = ["1", "2", "3", "4", "5"]
+        # with gr.Tab(f"{english_order[order]}: {comp}") as tab:
+        with gr.Tab(f"{english_order[order]}-1:Discuss"):
+            gr.HTML(value=general_instruction, label="General Instruction")
+            with gr.Row():
+                # Left column: this round's stock and the user narrative.
+                with gr.Column():
+                    with gr.Row():
+                        gr.HTML(
+                            value=round_instruction,
+                            label="Round Instruction",
+                        )
+                # Right column: the chat with the advisor.
+                with gr.Column():
+                    with gr.Row():
+                        chatbot = gr.Chatbot(height=600)
+                    with gr.Row():
+                        start_conversation = gr.Button(value="Start Conversation")
+                    with gr.Row():
+                        msg = gr.Textbox(scale=1, label="User Input")
+                    with gr.Row():
+                        # Both start disabled; respond_start_conversation returns them as interactive.
+                        msg_button = gr.Button(value="Send This Message to Advisor", interactive=False)
+                        continue_button = gr.Button(value="Show More of the Advisor’s Answer", interactive=False)
+            with gr.Row():
+                clear = gr.ClearButton([msg, chatbot])
+            if DEBUG:
+                with gr.Row():
+                    # Shown for inspection only; not part of the returned dict.
+                    display_prompt = gr.HTML(
+                        value=display_system_instruction_with_html(system_instruction),
+                        label="System Instruction",
+                    )
+        with gr.Tab(f"{english_order[order]}-2:Eval"):
+            with gr.Row():
+                gr.HTML(value=EVALUATION_INSTRUCTION)
+            with gr.Row():
+                dropdown = gr.Dropdown(
+                    label="Would you like to purchase the stock?",
+                    choices=["Yes", "No"],
+                    show_label=True,
+                )
+                reason = gr.Textbox(
+                    scale=1,
+                    label="Reason for Your Choice (Explain Your Reasoning & Highlight Useful Parts of Conversation)",
+                    lines=5,
+                )
+            # Four 1-100 sliders, each defaulting to 50.
+            with gr.Row():
+                trust = gr.Slider(
+                    label="Trust",
+                    minimum=1,
+                    maximum=100,
+                    value=50,
+                    info="How much do you trust the financial advisor? Answer from 1 to 100. A score of 100 means you have complete trust in the financial advisor, while a score of 1 means you have no trust at all.",
+                    step=1,
+                )
+                satisfaction = gr.Slider(
+                    label="Satisfaction",
+                    minimum=1,
+                    maximum=100,
+                    value=50,
+                    info="How satisfied are you with the financial advisor? Answer from 1 to 100. A score of 100 means you are completely satisfied, while a score of 1 means you are not satisfied at all.",
+                    step=1,
+                )
+            with gr.Row():
+                knowledgeable = gr.Slider(
+                    label="Knowledgeable",
+                    minimum=1,
+                    maximum=100,
+                    value=50,
+                    info="How knowledgeable do you feel after interacting with the financial advisor? Answer from 1 to 100. A score of 100 means you feel very knowledgeable, while a score of 1 means you feel not knowledgeable at all.",
+                    step=1,
+                )
+                helpful = gr.Slider(
+                    label="Helpful",
+                    minimum=1,
+                    maximum=100,
+                    value=50,
+                    info="How helpful do you find the financial advisor? Answer from 1 to 100. A score of 100 means you find the financial advisor very helpful, while a score of 1 means you find the financial advisor not helpful at all.",
+                    step=1,
+                )
+            evaluation_send_button = gr.Button(value="Send: Evaluation")
+        return {
+            "comp": comp,
+            "system_instruction": system_instruction,
+            "start_conversation": start_conversation,
+            "msg_button": msg_button,
+            "continue_button": continue_button,
+            "chatbot": chatbot,
+            "msg": msg,
+            "dropdown": dropdown,
+            "reason": reason,
+            "trust": trust,
+            "satisfaction": satisfaction,
+            "knowledgeable": knowledgeable,
+            "helpful": helpful,
+            "evaluation_send_button": evaluation_send_button,
+        }
+    def tab_creation_preference_stage():
+        with gr.Row():
+            gr.HTML(value=PREFERENCE_ELICITATION_TASK, label="Preference Elicitation Task")
+        with gr.Row():
+            with gr.Column():
+                whole_user_narrative = get_user_narrative_html(user_narrative)
+                gr.HTML(value=whole_user_narrative, label="User Narrative")
+            with gr.Column():
+                with gr.Row():
+                    elicitation_chatbot = gr.Chatbot(height=600)
+                with gr.Row():
+                    start_conversation = gr.Button(value="Start Conversation")
+                with gr.Row():
+                    msg = gr.Textbox(scale=1, label="User Input")
+                with gr.Row():
+                    msg_button = gr.Button(value="Send This Message to Advisor", interactive=False)
+                    continue_button = gr.Button(value="Show More of the Advisor’s Answer", interactive=False)
+        return {
+            "start_conversation": start_conversation,
+            "msg_button": msg_button,
+            "continue_button": continue_button,
+            "msg": msg,
+            "elicitation_chatbot": elicitation_chatbot,
+        }
+    def tab_final_evaluation(first_comp, second_comp, third_comp, fourth_comp, fifth_comp):
+        with gr.Row():
+            gr.HTML(value=FINAL_EVALUATION)
+        with gr.Row():
+            ranking_first_comp = gr.Dropdown(choices=[1, 2, 3, 4, 5], label=f"{first_comp}")
+            ranking_second_comp = gr.Dropdown(choices=[1, 2, 3, 4, 5], label=f"{second_comp}")
+            ranking_third_comp = gr.Dropdown(choices=[1, 2, 3, 4, 5], label=f"{third_comp}")
+            ranking_fourth_comp = gr.Dropdown(choices=[1, 2, 3, 4, 5], label=f"{fourth_comp}")
+            ranking_fifth_comp = gr.Dropdown(choices=[1, 2, 3, 4, 5], label=f"{fifth_comp}")
+        with gr.Row():
+            textbox = gr.HTML(
+                """<div style="background-color: #f8d7da; color: #721c24; padding: 15px; border: 1px solid #f5c6cb; border-radius: 5px; margin-bottom: 20px;">
+                    <strong>Please rank the stocks from 1 to 5, where 1 is the most preferred and 5 is the least preferred.</strong>
+                    <br>
+                    <strong>Make sure to assign different scores to different stocks.</strong>
+                </div>"""
+            )
+            submit_ranking = gr.Button(value="Submit Ranking")
+        return {
+            "first": {"comp": first_comp, "ranking_first_comp": ranking_first_comp},
+            "second": {"comp": second_comp, "ranking_second_comp": ranking_second_comp},
+            "third": {"comp": third_comp, "ranking_third_comp": ranking_third_comp},
+            "fourth": {"comp": fourth_comp, "ranking_fourth_comp": ranking_fourth_comp},
+            "fifth": {"comp": fifth_comp, "ranking_fifth_comp": ranking_fifth_comp},
+            "submit_ranking": submit_ranking,
+            "text_box": textbox,
+        }
+    def click_control_exploration_stage(tabs):
+        (
+            comp,
+            system_instruction,
+            start_conversation,
+            msg_button,
+            continue_button,
+            chatbot,
+            msg,
+            dropdown,
+            reason,
+            trust,
+            satisfaction,
+            knowledgeable,
+            helpful,
+            evaluation_send_button,
+        ) = (
+            tabs["comp"],
+            tabs["system_instruction"],
+            tabs["start_conversation"],
+            tabs["msg_button"],
+            tabs["continue_button"],
+            tabs["chatbot"],
+            tabs["msg"],
+            tabs["dropdown"],
+            tabs["reason"],
+            tabs["trust"],
+            tabs["satisfaction"],
+            tabs["knowledgeable"],
+            tabs["helpful"],
+            tabs["evaluation_send_button"],
+        )
+        start_conversation.click(
+            lambda history: respond_start_conversation(history, system_instruction, comp),
+            [chatbot],
+            [chatbot, start_conversation, msg_button, continue_button],
+        )
+        msg_button.click(
+            lambda message, history: respond(message, tab_data[comp]["history"], system_instruction, comp),
+            [msg, chatbot],
+            [msg, chatbot],
+        )
+        continue_button.click(
+            lambda history: respond_continue(tab_data[comp]["history"], system_instruction, comp),
+            [chatbot],
+            [chatbot],
+        )
+        evaluation_send_button.click(
+            lambda dropdown, reason, trust, satisfaction, knowledgeable, helpful: respond_evaluation(
+                {
+                    "selection": dropdown,
+                    "reason": reason,
+                    "trust": trust,
+                    "satisfaction": satisfaction,
+                    "knowledgeable": knowledgeable,
+                    "helpful": helpful,
+                },
+                comp,
+            ),
+            [dropdown, reason, trust, satisfaction, knowledgeable, helpful],
+            [dropdown, reason, trust, satisfaction, knowledgeable, helpful],
+        )
+    def click_control_preference_stage(tabs):
+        (
+            start_conversation,
+            msg_button,
+            continue_button,
+            elicitation_chatbot,
+            msg,
+        ) = (
+            tabs["start_conversation"],
+            tabs["msg_button"],
+            tabs["continue_button"],
+            tabs["elicitation_chatbot"],
+            tabs["msg"],
+        )
+        start_conversation.click(
+            lambda history: respond_start_conversation(
+                history, SYSTEM_INSTRUECTION_PREFERENCE_ELICITATION, user_elicitation=True
+            ),
+            [elicitation_chatbot],
+            [elicitation_chatbot, start_conversation, msg_button, continue_button],
+        )
+        msg_button.click(
+            lambda message, history: respond(
+                message,
+                user_preference_elicitation_data["history"],
+                SYSTEM_INSTRUECTION_PREFERENCE_ELICITATION,
+                user_elicitation=True,
+            ),
+            [msg, elicitation_chatbot],
+            [msg, elicitation_chatbot],
+        )
+        continue_button.click(
+            lambda history: respond_continue(
+                user_preference_elicitation_data["history"],
+                SYSTEM_INSTRUECTION_PREFERENCE_ELICITATION,
+                user_elicitation=True,
+            ),
+            [elicitation_chatbot],
+            [elicitation_chatbot],
+        )
+    def click_control_final_evaluation(tabs):
+        first_comp, ranking_first_comp = tabs["first"]["comp"], tabs["first"]["ranking_first_comp"]
+        second_comp, ranking_second_comp = tabs["second"]["comp"], tabs["second"]["ranking_second_comp"]
+        third_comp, ranking_third_comp = tabs["third"]["comp"], tabs["third"]["ranking_third_comp"]
+        fourth_comp, ranking_fourth_comp = tabs["fourth"]["comp"], tabs["fourth"]["ranking_fourth_comp"]
+        fifth_comp, ranking_fifth_comp = tabs["fifth"]["comp"], tabs["fifth"]["ranking_fifth_comp"]
+        result_textbox = tabs["text_box"]
+        submit_ranking = tabs["submit_ranking"]
+        submit_ranking.click(
+            lambda ranking_first_comp, ranking_second_comp, ranking_third_comp, ranking_fourth_comp, ranking_fifth_comp: respond_final_ranking(
+                first_comp,
+                ranking_first_comp,
+                second_comp,
+                ranking_second_comp,
+                third_comp,
+                ranking_third_comp,
+                fourth_comp,
+                ranking_fourth_comp,
+                fifth_comp,
+                ranking_fifth_comp,
+            ),
+            # Input components (names and rankings)
+            [
+                ranking_first_comp,
+                ranking_second_comp,
+                ranking_third_comp,
+                ranking_fourth_comp,
+                ranking_fifth_comp,
+            ],
+            # Output component(s) where you want the result to appear, e.g., result_textbox
+            [result_textbox],
+        )
+    def respond(message, history, system_instruction, tab_name=None, user_elicitation=False):
+        """Generate the advisor's reply to ``message`` and store the updated history.
+
+        Args:
+            message: The user's message.
+            history: Conversation so far, in the format accepted by
+                ``gradio_to_huggingface_message``.
+            system_instruction: System prompt for this conversation; outside
+                preference elicitation the user profile is appended to it.
+            tab_name: Key into ``tab_data`` (the stock tab); may be None only
+                when ``user_elicitation`` is True.
+            user_elicitation: True when called from the preference-elicitation tab.
+
+        Returns:
+            ``("", history)``: an empty string (wired to the input textbox)
+            and the history as converted by ``huggingface_to_gradio_message``.
+        """
+        assert (
+            tab_name is not None or user_elicitation is True
+        ), "Tab name is required for the start of the conversation unless it is not preference elicitation."
+        # Add user profile to system instruction
+        if not user_elicitation:
+            system_instruction = add_user_profile_to_system_instruction(
+                system_instruction,
+                user_preference_elicitation_data,
+                summary=USER_PREFERENCE_SUMMARY,
+                model=model,
+                terminator=terminator,
+            )
+            # print(f"Tab: {tab_name}\nSystem Instruction:{system_instruction}")
+        # Formatting Input
+        print(f"User Message: {message} in Tab: {tab_name}")
+        # From string to list [{"role":"user", "content": message}, ...]
+        history = gradio_to_huggingface_message(history)
+        # We can implement context window here as we need all the system interaction. We can cut some of the early interactions if needed.
+        history = conversation_window(history, CONV_WINDOW)
+        print(f"History Length: {len(history)}")
+        print(f"History: {history}")
+        # Add system instruction to the history
+        history = format_context(system_instruction, history)
+        # Add user message to the history
+        history_with_user_utterance = format_user_message(message, history)
+        outputs_text, history = response_generation(
+            history_with_user_utterance,
+            model,
+            tokenizer,
+            max_tokens=128,
+            device=DEVICE,
+            terminators=terminator,
+        )
+        # exclude system interaction and store the others in the history
+        history = huggingface_to_gradio_message(history)
+        if tab_name is not None:
+            print(f"Tab: {tab_name}\nSystem Output: {outputs_text}")
+            # Log the user message and response
+            log_action(tab_name, "User Message", message)
+            log_action(tab_name, "Response", outputs_text)
+            # Store the updated history for this tab
+            tab_data[tab_name]["history"] = history
+        if user_elicitation:
+            print(f"User Elicitation\nSystem Output: {outputs_text}")
+            log_action("User_Elicitation", "User Message", message)
+            log_action("User_Elicitation", "Response", outputs_text)
+            # The elicitation history is what later gets summarized into the user profile.
+            user_preference_elicitation_data["history"] = history
+        return "", history
+    def respond_start_conversation(history, system_instruction, tab_name=None, user_elicitation=False):
+        assert (
+            tab_name is not None or user_elicitation is True
+        ), "Tab name is required for the start of the conversation unless it is not preference elicitation."
+        if not user_elicitation:
+            system_instruction = add_user_profile_to_system_instruction(
+                system_instruction,
+                user_preference_elicitation_data,
+                summary=USER_PREFERENCE_SUMMARY,
+                model=model,
+                terminator=terminator,
+            )
+            print(f"Tab: {tab_name}\nSystem Instruction:{system_instruction}")
+        history = gradio_to_huggingface_message(history)
+        history = format_context(system_instruction, history)
+        first_message = FIRST_MESSAGE
+        history_with_user_utterance = format_user_message(first_message, history)
+        outputs_text, history = response_generation(
+            history_with_user_utterance,
+            model,
+            tokenizer,
+            max_tokens=128,
+            device=DEVICE,
+            terminators=terminator,
+        )
+        # Format
+        history = huggingface_to_gradio_message(history)
+        if tab_name is not None:
+            print(f"Tab: {tab_name}\nHistory: {history}")
+            # Log the user message and response
+            log_action(tab_name, "User Message", first_message)
+            log_action(tab_name, "Response", outputs_text)
+            # Store the updated history for this tab
+            tab_data[tab_name]["history"] = history
+        if user_elicitation:
+            print(f"User Elicitation\nHistory: {history}")
+            log_action("User_Elicitation", "User Message", first_message)
+            log_action("User_Elicitation", "Response", outputs_text)
+            user_preference_elicitation_data["history"] = history
+        return (
+            history,
+            gr.Button(value="Start Conversation", interactive=False),
+            gr.Button(value="Send This Message to Advisor", interactive=True),
+            gr.Button(value="Show More of the Advisor’s Answer", interactive=True),
+        )
+    def respond_continue(history, system_instruction, tab_name=None, user_elicitation=False):
+        assert (
+            tab_name is not None or user_elicitation is True
+        ), "Tab name is required for the start of the conversation."
+        # Add user profile to system instruction
+        if not user_elicitation:
+            system_instruction = add_user_profile_to_system_instruction(
+                system_instruction,
+                user_preference_elicitation_data,
+                summary=USER_PREFERENCE_SUMMARY,
+                model=model,
+                terminator=terminator,
+            )
+            # print(f"Tab: {tab_name}\nSystem Instruction:{system_instruction}")
+        message = "continue"
+        history = gradio_to_huggingface_message(history)
+        history = conversation_window(history, CONV_WINDOW)
+        history = format_context(system_instruction, history)
+        history_with_user_utterance = format_user_message(message, history)
+        outputs_text, history = response_generation(
+            history_with_user_utterance,
+            model,
+            tokenizer,
+            max_tokens=128,
+            device=DEVICE,
+            terminators=terminator,
+        )
+        history = huggingface_to_gradio_message(history)
+        if tab_name is not None:
+            log_action(tab_name, "Show More of the Advisor’s Answer", "User continued the conversation")
+            log_action(tab_name, "Response", outputs_text)
+            # Update history for this tab
+            tab_data[tab_name]["history"] = history
+        if user_elicitation:
+            print(f"User Elicitation\nSystem Output: {outputs_text}")
+            log_action("User_Elicitation", "Response", outputs_text)
+            user_preference_elicitation_data["history"] = history
+        return history
+    def respond_evaluation(evals, tab_name):
+        # dropdown, readon_button, multi-evaluator
+        log_action(tab_name, "Round Evaluation", "Following")
+        for key, value in evals.items():
+            log_action(tab_name, key, value)
+        # Store the reason for this tab
+        tab_data[tab_name]["multi_evaluator"] = evals
+        return (
+            evals["selection"],
+            evals["reason"],
+            evals["trust"],
+            evals["satisfaction"],
+            evals["knowledgeable"],
+            evals["helpful"],
+        )
+    def respond_final_ranking(
+        first_comp,
+        ranking_first_comp,
+        second_comp,
+        ranking_second_comp,
+        third_comp,
+        ranking_third_comp,
+        fourth_comp,
+        ranking_fourth_comp,
+        fifth_comp,
+        ranking_fifth_comp,
+    ):
+        # make sure that they are not the same
+        ranking_list = [
+            ranking_first_comp,
+            ranking_second_comp,
+            ranking_third_comp,
+            ranking_fourth_comp,
+            ranking_fifth_comp,
+        ]
+        if len(set(ranking_list)) != len(ranking_list):
+            return """<div style="background-color: #fff3cd; color: #856404; padding: 15px; border: 1px solid #ffeeba; border-radius: 5px; margin-bottom: 20px;">
+                        <strong>Please make sure that you are not ranking the same stock multiple times.</strong>
+                    </div>"""
+        else:
+            log_action("Final_Ranking", first_comp, ranking_first_comp)
+            log_action("Final_Ranking", second_comp, ranking_second_comp)
+            log_action("Final_Ranking", third_comp, ranking_third_comp)
+            log_action("Final_Ranking", fourth_comp, ranking_fourth_comp)
+            log_action("Final_Ranking", fifth_comp, ranking_fifth_comp)
+            return """<div style="background-color: #d4edda; color: #155724; padding: 15px; border: 1px solid #c3e6cb; border-radius: 5px; margin-bottom: 20px;">
+                        <strong>Thank you for participating in the experiment. This concludes the session. You may now close the tab.</strong>
+                    </div>"""
+    def get_context(index):
+        comp = raw_context_list[index]["short_name"]
+        context = stock_context_list[index]
+        general_instruction, round_instruction = get_task_instruction_for_user(raw_context_list[index])
+        return comp, context, general_instruction, round_instruction
+    # Assemble the app: instruction tab, preference elicitation, five stock rounds, final ranking.
+    with gr.Blocks(title="RAG Chatbot Q&A", theme="Soft") as demo:
+        # Only the company names are used below; the other unpacked values are not read again here.
+        first_comp, first_context, first_general_instruction, first_round_instruction = get_context(0)
+        second_comp, second_context, second_general_instruction, second_round_instruction = get_context(1)
+        third_comp, third_context, third_general_instruction, third_round_instruction = get_context(2)
+        fourth_comp, fourth_context, forth_general_instruction, forth_round_instruction = get_context(3)
+        fifth_comp, fifth_context, fifth_general_instruction, fifth_round_instruction = get_context(4)
+        # The narrative of the first entry is the one shown in the preference-elicitation tab.
+        user_narrative = markdown.markdown(raw_context_list[0]["user_narrative"].replace("\n", "<br>"))
+        # Initialize tab data
+        for comp in [first_comp, second_comp, third_comp, fourth_comp, fifth_comp]:
+            tab_data[comp] = {"history": [], "selection": "", "reason": ""}
+        # Experiment Instruction
+        with gr.Tab("Experiment Instruction") as instruction_tab:
+            gr.HTML(value=INSTRUCTION_PAGE, label="Experiment Instruction")
+        # User Preference Elicitation Tab
+        with gr.Tab("Preference Elicitation Stage") as preference_elicitation_tab:
+            user_preference_elicitation_tab = tab_creation_preference_stage()
+            click_control_preference_stage(user_preference_elicitation_tab)
+        with gr.Tab("Financial Decision Stage"):
+            # Experiment tabs: each stock gets its components created, then its handlers wired.
+            first_tab = tab_creation_exploration_stage(0)
+            click_control_exploration_stage(first_tab)
+            second_tab = tab_creation_exploration_stage(1)
+            click_control_exploration_stage(second_tab)
+            third_tab = tab_creation_exploration_stage(2)
+            click_control_exploration_stage(third_tab)
+            fourth_tab = tab_creation_exploration_stage(3)
+            click_control_exploration_stage(fourth_tab)
+            fifth_tab = tab_creation_exploration_stage(4)
+            click_control_exploration_stage(fifth_tab)
+        with gr.Tab("Final Evaluation Stage") as final_evaluation:
+            final_evaluation_tab = tab_final_evaluation(first_comp, second_comp, third_comp, fourth_comp, fifth_comp)
+            click_control_final_evaluation(final_evaluation_tab)
+    return demo
+if __name__ == "__main__":
+    # Script entry point: authenticate, load the demo data, build the shared
+    # system prompt, load the response model, then launch the Gradio app.
+    login_to_huggingface(ACCESS)
+    file_path = os.path.join(ROOT_FILE, "./data/single_stock_data/single_stock_demo.jsonl")
+    context_info = get_context(file_path)  # str to List of Dict
+    # For Demo Usage, just use the first dict
+    context_info = context_info[0]
+    stock_context_list = build_context(context_info)  # List of str
+    # Per-stock records; create_demo indexes them by key (e.g. "user_narrative").
+    raw_context_list = build_raw_context_list(context_info)
+    # system instruction consist of Task, Personality, and Context
+    # Personality options, one pole chosen per pair:
+    #   ["extroverted", "introverted"]
+    #   ["agreeable", "antagonistic"]
+    #   ["conscientious", "unconscientious"]
+    #   ["neurotic", "emotionally stable"]
+    #   ["open to experience", "closed to experience"]
+    personality = [
+        "extroverted",
+        "agreeable",
+        "conscientious",
+        "emotionally stable",
+        "open to experience",
+    ]
+    personality_prompt = build_personality_prompt(personality)
+    system_instruction_without_context = SYSTEM_INSTRUCTION + "\n" + personality_prompt + "\n"
+    # if DEBUG:
+    #     tokenizer, terminator, model = "", "", ""
+    # else:
+    tokenizer = AutoTokenizer.from_pretrained(RESPONSE_GENERATOR)
+    tokenizer, terminator = prepare_tokenizer(tokenizer)
+    # (A stray bare `p` statement used to sit here and raised NameError
+    # before the model could be loaded.)
+    model = AutoModelForCausalLM.from_pretrained(
+        RESPONSE_GENERATOR,
+        torch_dtype=torch.float16,
+        pad_token_id=tokenizer.eos_token_id,
+    ).to(DEVICE)
+    demo = create_demo(
+        model, tokenizer, terminator, system_instruction_without_context, stock_context_list, raw_context_list
+    )
+    demo.launch(share=True)

experiments/single_stock_experiment.py ADDED Viewed

	@@ -0,0 +1,574 @@

+import subprocess
+import sys
+import os
+from components.induce_personality import (
+    construct_big_five_words,
+)
+# need to import: gradio
+def install(package, upgrade=False):
+    """Install ``package`` with pip, using the interpreter running this script.
+
+    Args:
+        package: Requirement specifier passed to ``pip install`` as-is.
+        upgrade: When true, ``--upgrade`` is added to the pip command.
+
+    Raises:
+        subprocess.CalledProcessError: If pip exits with a non-zero status
+            (the command is run with ``check=True``).
+    """
+    pip_command = [sys.executable, "-m", "pip", "install"]
+    if upgrade:
+        pip_command.append("--upgrade")
+    pip_command.append(package)
+    subprocess.run(pip_command, check=True)
+# install("ipdb")
+# install("gradio")
+# install("sentence-transformers")
+# install("git+https://github.com/terrierteam/pyterrier_t5.git")
+# install("protobuf")
+# install("transformers", upgrade=True)
+import random
+import json
+import gradio as gr
+import random
+import time
+import ipdb
+import markdown
+import gradio as gr
+import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer
+from utils import login_to_huggingface, ACCESS
+from components.rag_components import (
+    rag,
+    retrieve_passage,
+    response_generation,
+)
+from components.rewrite_passages import rewrite_rag_context
+from components.query_rewriting import rewrite_query
+from components.chat_conversation import (
+    format_message_history,
+    format_user_message,
+    format_context,
+    gradio_to_huggingface_message,
+    huggingface_to_gradio_message,
+    get_system_instruction,
+    prepare_tokenizer,
+    format_rag_context,
+)
+from components.constant import (
+    ACCESS,
+    QUERY_REWRITING,
+    RAG,
+    PERSONALITY,
+    PERSONALITY_LIST,
+    REWRITE_PASSAGES,
+    NUM_PASSAGES,
+    DEVICE,
+    RESPONSE_GENERATOR,
+)
+from components.induce_personality import (
+    build_personality_prompt,
+)
+# LOG_FILE = "log_file_bingzhi_information_seeking.txt"
+# Directory that contains this script; log and data paths are built from it.
+ROOT_FILE = os.path.dirname(os.path.abspath(__file__))
+LOG_DIR = os.path.join(ROOT_FILE, "log/single_stock_experiment/othres/")
+# exist_ok avoids the check-then-create race of a separate os.path.exists test.
+os.makedirs(LOG_DIR, exist_ok=True)
+# NOTE(review): this path is relative to the current working directory, not to
+# ROOT_FILE, so the script presumably has to be started from the repo root.
+STATIC_FILE = os.path.join("_static")
+# Static HTML / text fragments are read once at import time.
+with open(os.path.join(STATIC_FILE, "html/instruction_page.html"), "r") as f:
+    INSTRUCTION_PAGE = f.read()
+with open(os.path.join(STATIC_FILE, "html/evaluation_instruction.html"), "r") as f:
+    EVALUATION_INSTRUCTION = f.read()
+with open(os.path.join(STATIC_FILE, "txt/general_instruction_task.txt"), "r") as f:
+    GENERAL_INSTRUCTION_TASK = f.read()
+with open(os.path.join(STATIC_FILE, "txt/general_instruction_button.txt"), "r") as f:
+    GENERAL_INSTRUCTION_BUTTON = f.read()
+# NOTE(review): confirm that txt/system_instruction.txt is shipped with the repo.
+with open(os.path.join(STATIC_FILE, "txt/system_instruction.txt"), "r") as f:
+    SYSTEM_INSTRUCTION = f.read()
+# Message sent on the user's behalf when "Start Conversation" is clicked.
+FIRST_MESSAGE = "Hey"
+INFORMATION_SEEKING = True
+# When true, the __main__ block skips loading the tokenizer and model.
+DEBUG = False
+def get_context(synthetic_data_path):
+    """Load a JSON Lines file and return its records as a list.
+
+    Args:
+        synthetic_data_path: Path to a file holding one JSON document per line.
+
+    Returns:
+        A list with one decoded object per non-blank line, in file order.
+
+    Raises:
+        OSError: If the file cannot be opened.
+        json.JSONDecodeError: If a non-blank line is not valid JSON.
+    """
+    # Read as UTF-8 explicitly so the result does not depend on the locale.
+    with open(synthetic_data_path, "r", encoding="utf-8") as f:
+        # Blank or whitespace-only lines (e.g. a trailing empty line) are
+        # skipped instead of crashing json.loads.
+        return [json.loads(line) for line in f if line.strip()]
+def add_ticker_prefix(ticker_list, context_list):
+    """Return every context prefixed with its ticker as ``"<ticker>: <context>"``.
+
+    The two lists are paired positionally with ``zip``, so surplus items in
+    the longer list are ignored.
+    """
+    return [f"{symbol}: {text}" for symbol, text in zip(ticker_list, context_list)]
+def build_raw_context_list(context_dict):
+    """Return the object stored under ``context_dict["data"]`` unchanged."""
+    raw_records = context_dict["data"]
+    return raw_records
+def build_context(context_dict):
+    """Render each record under ``context_dict["data"]`` with build_context_element.
+
+    Returns:
+        A list of the rendered strings, in the same order as the records.
+    """
+    rendered = []
+    for record in context_dict["data"]:
+        rendered.append(build_context_element(record))
+    return rendered
+def build_context_element(context):
+    """Render one stock record as the text block placed in the system prompt.
+
+    Args:
+        context: Mapping with the keys "sector", "business_summary",
+            "short_name", "price_data", "earning_summary" and "beta". A
+            "ticker" key may be present but is not used in the output, so it
+            is no longer required.
+
+    Returns:
+        A string whose first line names the stock candidate and whose
+        remaining lines list industry, beta, earning summary, monthly
+        stock prices and business summary.
+
+    Raises:
+        KeyError: If one of the required keys is missing.
+    """
+    sector = context["sector"]
+    business_summary = context["business_summary"]
+    name = context["short_name"]
+    stock_price = context["price_data"]
+    earning = context["earning_summary"]
+    beta = context["beta"]
+    stock_candidate = f"Stock Candidate: {name}"
+    # The separators (including the ", " after each newline) are kept exactly
+    # as before so the prompt text does not change.
+    stock_info = (
+        f"Stock Information: \nIndustry - {sector}, "
+        f"\nBeta (risk indicator) - {beta}, "
+        f"\nEarning Summary - {earning}\n, "
+        f"2023 Monthly Stock Price - {stock_price}\n, "
+        f"Business Summary - {business_summary}"
+    )
+    return "\n".join([stock_candidate, stock_info])
+def get_task_instruction_for_user(context):
+    """Build the two HTML panels shown to the participant for one stock round.
+
+    Args:
+        context: Mapping for one stock; the keys "short_name" and
+            "user_narrative" are read here.
+
+    Returns:
+        A ``(general_instruction, round_instruction)`` tuple of HTML strings.
+        The first embeds GENERAL_INSTRUCTION_TASK and
+        GENERAL_INSTRUCTION_BUTTON; the second embeds the stock's short name
+        and the rendered user narrative.
+    """
+    ticker_name = context["short_name"]
+    user_narrative = context["user_narrative"]
+    # Newlines become <br> before the text is handed to the Markdown renderer.
+    user_narrative = user_narrative.replace("\n", "<br>")
+    html_user_narrative = markdown.markdown(user_narrative)
+    # Panel with the task description that is the same for every round.
+    general_instruction = f"""<!-- Grouped Container for Task Instruction and Stock Information -->
+<div style="background-color: #f9f9f9; padding: 20px; border-radius: 10px; box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1); margin-bottom: 20px; max-height: 780px; overflow-y: auto; overflow-x: hidden;">
+    <!-- Heading -->
+    <h2 style="color: #2c3e50; text-align: center; margin-bottom: 20px; font-size: 20px; font-weight: 600;">
+        General Instruction
+    </h2>
+    <!-- User Instruction -->
+    <p style="text-align: left; font-size: 16px; color: #34495e; margin-bottom: 20px;">
+        {GENERAL_INSTRUCTION_TASK}
+        {GENERAL_INSTRUCTION_BUTTON}
+    </p>
+</div>"""
+    # Panel with the round-specific stock name and user narrative.
+    round_instruction = f"""
+<div style="background-color: #f9f9f9; padding: 20px; border-radius: 10px; box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1); margin-bottom: 20px; max-height: 780px; overflow-y: auto; overflow-x: hidden;">
+    <!-- Stock Information (Bold label, Normal ticker name) -->
+    <h2 style="color: #2c3e50; text-align: center; margin-bottom: 20px; font-size: 20px; font-weight: 600;">
+        Round Info
+    </h2>
+    <div style="text-align: left; font-size: 20px; font-weight: bold; margin-bottom: 20px;">
+        Stock
+    </div>
+    <div style="text-align: left; font-weight: normal; font-size: 16px; margin-bottom: 20px;">
+        <span style="font-weight: bold;">
+            This Round's Stock:
+        </span>
+        {ticker_name}
+    </div>
+    <!-- User Narrative (Bold label, Normal narrative) -->
+    <div style="text-align: left; font-size: 20px; font-weight: bold; margin-bottom: 20px;">
+        User Narrative
+    </div>
+    <div style="text-align: left; font-weight: normal; font-size: 16px; margin-bottom: 20px;">
+        {html_user_narrative}
+    </div>
+</div>"""
+    return general_instruction, round_instruction
+def display_system_instruction_with_html(
+    system_instruction,
+):
+    """Wrap ``system_instruction`` in a left-aligned HTML paragraph.
+
+    The value is interpolated as-is (no HTML escaping) and the surrounding
+    whitespace of the template is part of the returned string.
+    """
+    return (
+        "\n"
+        '        <p style="text-align: left; margin-bottom: 10px;">\n'
+        f"            {system_instruction}\n"
+        "        </p>\n"
+        "    "
+    )
+def create_demo(
+    model,
+    tokenizer,
+    terminator,
+    system_description_without_context,
+    stock_context_list,
+    raw_context_list,
+):
+    # Store the history here and use this as an input to each tab.
+    tab_data = {}
+    tab_gradio = {}
+    def tab_creation(order):
+        """Build the Gradio tab for one stock round and return its components.
+
+        Args:
+            order: Zero-based round index; it selects the stock via
+                get_context and the ordinal word used in the tab title.
+
+        Returns:
+            A dict holding the company name ("comp"), the full system
+            instruction for this stock and the interactive components that
+            click_control attaches handlers to.
+        """
+        comp, contex, general_instruction, round_instruction = get_context(order)
+        system_instruction = system_description_without_context + "\n" + contex
+        tab_data[comp] = {"history": [], "selection": "", "reason": ""}
+        ordinal_words = ("First", "Second", "Third", "Fourth", "Fifth")
+
+        def rating_slider(label, info):
+            # All four evaluation sliders share the same 1-100 scale.
+            return gr.Slider(label=label, minimum=1, maximum=100, value=50, info=info, step=1)
+
+        with gr.Tab(f"{ordinal_words[order]}: {comp}"):
+            with gr.Tab("Interaction with a Financial Advisor"):
+                gr.HTML(value=general_instruction, label="General Instruction")
+                with gr.Row():
+                    # Left column: round information for the participant.
+                    with gr.Column():
+                        with gr.Row():
+                            gr.HTML(value=round_instruction, label="Round Instruction")
+                    # Right column: the chat widgets.
+                    with gr.Column():
+                        with gr.Row():
+                            chatbot = gr.Chatbot(height=600)
+                        with gr.Row():
+                            start_conversation = gr.Button(value="Start Conversation")
+                        with gr.Row():
+                            msg = gr.Textbox(scale=1, label="Input: User Input")
+                        with gr.Row():
+                            # Both stay disabled until the conversation has been started.
+                            msg_button = gr.Button(value="Send: User Input", interactive=False)
+                            continue_button = gr.Button(value="Continue", interactive=False)
+                with gr.Row():
+                    gr.ClearButton([msg, chatbot])
+                # if DEBUG:
+                with gr.Row():
+                    gr.HTML(
+                        value=display_system_instruction_with_html(system_instruction),
+                        label="System Instruction",
+                    )
+            with gr.Tab("Evaluation"):
+                with gr.Row():
+                    gr.HTML(value=EVALUATION_INSTRUCTION)
+                with gr.Row():
+                    dropdown = gr.Dropdown(
+                        label="Decision Making",
+                        choices=["Purchase", "Not Purchase"],
+                        show_label=True,
+                    )
+                    reason = gr.Textbox(scale=1, label="The reason of your choice")
+                with gr.Row():
+                    trust = rating_slider(
+                        "Trust",
+                        "How much do you trust the financial advisor? Answer from 1 to 100.",
+                    )
+                    satisfaction = rating_slider(
+                        "Satisfaction",
+                        "How satisfied are you with the financial advisor? Answer from 1 to 100.",
+                    )
+                with gr.Row():
+                    knowledgeable = rating_slider(
+                        "Knowledgeable",
+                        "How knowledgeable do you feel after interacting with the financial advisor? Answer from 1 to 100.",
+                    )
+                    helpful = rating_slider(
+                        "Helpful",
+                        "How helpful do you find the financial advisor? Answer from 1 to 100.",
+                    )
+                evaluation_send_button = gr.Button(value="Send: Evaluation")
+        components = {
+            "comp": comp,
+            "system_instruction": system_instruction,
+            "start_conversation": start_conversation,
+            "msg_button": msg_button,
+            "continue_button": continue_button,
+            "chatbot": chatbot,
+            "msg": msg,
+            "dropdown": dropdown,
+            "reason": reason,
+            "trust": trust,
+            "satisfaction": satisfaction,
+            "knowledgeable": knowledgeable,
+            "helpful": helpful,
+            "evaluation_send_button": evaluation_send_button,
+        }
+        return components
+    def click_control(tabs):
+        """Attach the click handlers for one stock tab.
+
+        Args:
+            tabs: The dict returned by tab_creation (company name, system
+                instruction and the Gradio components of the tab).
+
+        The Send and Continue handlers now use the history that Gradio passes
+        in from the chatbot component. They previously ignored it and read
+        the closure-level ``tab_data`` instead, which is shared by every
+        visitor of the app and is not reset by the Clear button, so a cleared
+        or foreign conversation could reappear on the next message.
+        """
+        comp = tabs["comp"]
+        system_instruction = tabs["system_instruction"]
+        start_conversation = tabs["start_conversation"]
+        msg_button = tabs["msg_button"]
+        continue_button = tabs["continue_button"]
+        chatbot = tabs["chatbot"]
+        msg = tabs["msg"]
+        evaluation_send_button = tabs["evaluation_send_button"]
+        # Evaluation widgets, in the order respond_evaluation returns their values.
+        evaluation_fields = [
+            tabs["dropdown"],
+            tabs["reason"],
+            tabs["trust"],
+            tabs["satisfaction"],
+            tabs["knowledgeable"],
+            tabs["helpful"],
+        ]
+        start_conversation.click(
+            lambda history: respond_start_conversation(history, system_instruction, comp),
+            [chatbot],
+            [chatbot, start_conversation, msg_button, continue_button],
+        )
+        msg_button.click(
+            # `history or []` covers a chatbot value of None after a clear.
+            lambda message, history: respond(message, history or [], system_instruction, comp),
+            [msg, chatbot],
+            [msg, chatbot],
+        )
+        continue_button.click(
+            lambda history: respond_continue(history or [], system_instruction, comp),
+            [chatbot],
+            [chatbot],
+        )
+        evaluation_send_button.click(
+            lambda selection, reason, trust, satisfaction, knowledgeable, helpful: respond_evaluation(
+                {
+                    "selection": selection,
+                    "reason": reason,
+                    "trust": trust,
+                    "satisfaction": satisfaction,
+                    "knowledgeable": knowledgeable,
+                    "helpful": helpful,
+                },
+                comp,
+            ),
+            evaluation_fields,
+            evaluation_fields,
+        )
+    def log_action(tab_name, action, details):
+        """Append one ``Action: ... | Details: ...`` line to ``LOG_DIR/<tab_name>.txt``."""
+        target_path = os.path.join(LOG_DIR, f"{tab_name}.txt")
+        with open(target_path, "a") as log_handle:
+            log_handle.write(f"Action: {action} | Details: {details}\n")
+    def respond(message, history, system_instruction, tab_name):
+        """Generate the advisor's reply to ``message`` for one stock tab.
+
+        Args:
+            message: Text typed by the user.
+            history: Conversation so far, in Gradio chatbot format.
+            system_instruction: System prompt for this tab's stock.
+            tab_name: Key into ``tab_data`` and name of the log file.
+
+        Returns:
+            A ``("", history)`` tuple: an empty string for the input textbox
+            and the updated conversation in Gradio chatbot format.
+        """
+        print(f"User Message: {message} in Tab: {tab_name}")
+        # Gradio history -> Hugging Face messages, with the system prompt applied.
+        hf_messages = format_context(system_instruction, gradio_to_huggingface_message(history))
+        prompt_messages = format_user_message(message, hf_messages)
+        reply_text, hf_messages = response_generation(
+            prompt_messages,
+            model,
+            tokenizer,
+            max_tokens=128,
+            device=DEVICE,
+            terminators=terminator,
+        )
+        # Back to the format the chatbot component displays.
+        updated_history = huggingface_to_gradio_message(hf_messages)
+        print(f"Tab: {tab_name}\nHistory: {updated_history}")
+        log_action(tab_name, "User Message", message)
+        log_action(tab_name, "Response", reply_text)
+        # Remember the conversation for this tab.
+        tab_data[tab_name]["history"] = updated_history
+        return "", updated_history
+    def respond_start_conversation(history, system_instruction, tab_name):
+        """Open the conversation by sending FIRST_MESSAGE on the user's behalf.
+
+        Returns:
+            A 4-tuple: the updated Gradio history, a disabled
+            "Start Conversation" button, and enabled "Send: User Input" and
+            "Continue" buttons.
+        """
+        hf_messages = format_context(system_instruction, gradio_to_huggingface_message(history))
+        opening_message = FIRST_MESSAGE
+        prompt_messages = format_user_message(opening_message, hf_messages)
+        reply_text, hf_messages = response_generation(
+            prompt_messages,
+            model,
+            tokenizer,
+            max_tokens=128,
+            device=DEVICE,
+            terminators=terminator,
+        )
+        updated_history = huggingface_to_gradio_message(hf_messages)
+        print(f"Tab: {tab_name}\nHistory: {updated_history}")
+        log_action(tab_name, "User Message", opening_message)
+        log_action(tab_name, "Response", reply_text)
+        tab_data[tab_name]["history"] = updated_history
+        # Once started, lock the start button and unlock the chat controls.
+        start_button = gr.Button(value="Start Conversation", interactive=False)
+        send_button = gr.Button(value="Send: User Input", interactive=True)
+        go_on_button = gr.Button(value="Continue", interactive=True)
+        return updated_history, start_button, send_button, go_on_button
+    def respond_continue(history, system_instruction, tab_name):
+        """Ask the model to keep talking by sending the literal message "continue".
+
+        Returns:
+            The updated conversation in Gradio chatbot format.
+        """
+        hf_messages = format_context(system_instruction, gradio_to_huggingface_message(history))
+        prompt_messages = format_user_message("continue", hf_messages)
+        reply_text, hf_messages = response_generation(
+            prompt_messages,
+            model,
+            tokenizer,
+            max_tokens=128,
+            device=DEVICE,
+            terminators=terminator,
+        )
+        updated_history = huggingface_to_gradio_message(hf_messages)
+        log_action(tab_name, "Continue", "User continued the conversation")
+        log_action(tab_name, "Response", reply_text)
+        # Remember the conversation for this tab.
+        tab_data[tab_name]["history"] = updated_history
+        return updated_history
+    def respond_evaluation(evals, tab_name):
+        """Log and store the round evaluation submitted for one tab.
+
+        Args:
+            evals: Dict with the keys "selection", "reason", "trust",
+                "satisfaction", "knowledgeable" and "helpful".
+            tab_name: Key into ``tab_data`` and name of the log file.
+
+        Returns:
+            The six submitted values as a tuple, in the key order listed above.
+        """
+        log_action(tab_name, "Round Evaluation", "Following")
+        for field in evals:
+            log_action(tab_name, field, evals[field])
+        # Keep the whole evaluation with the tab's data.
+        tab_data[tab_name]["multi_evaluator"] = evals
+        output_order = ("selection", "reason", "trust", "satisfaction", "knowledgeable", "helpful")
+        return tuple(evals[field] for field in output_order)
+    def get_context(index):
+        """Return ``(company name, context text, general HTML, round HTML)`` for stock ``index``."""
+        record = raw_context_list[index]
+        comp = record["short_name"]
+        context = stock_context_list[index]
+        general_instruction, round_instruction = get_task_instruction_for_user(record)
+        return comp, context, general_instruction, round_instruction
+    with gr.Blocks(title="RAG Chatbot Q&A", theme="Soft") as demo:
+        # The experiment has five rounds, one stock each; only the company
+        # name is needed here (tab_creation builds the prompts itself).
+        company_names = [get_context(round_index)[0] for round_index in range(5)]
+        # Initialize tab data
+        for company in company_names:
+            tab_data[company] = {"history": [], "selection": "", "reason": ""}
+        # Experiment Instruction
+        with gr.Tab("Experiment Instruction"):
+            gr.HTML(value=INSTRUCTION_PAGE, label="Experiment Instruction")
+        # One tab per round: build its widgets, then wire its handlers.
+        for round_index in range(5):
+            click_control(tab_creation(round_index))
+    return demo
+if __name__ == "__main__":
+    # Script entry point: authenticate, load the demo data, build the shared
+    # system prompt, load the response model (unless DEBUG), launch the app.
+    login_to_huggingface(ACCESS)
+    demo_file = os.path.join(ROOT_FILE, "./data/single_stock_data/single_stock_demo.jsonl")
+    # For demo usage only the first record of the file is used.
+    first_record = get_context(demo_file)[0]
+    stock_context_list = build_context(first_record)  # one rendered text per stock
+    raw_context_list = build_raw_context_list(first_record)  # the records under "data"
+    # The system instruction consists of Task, Personality, and Context.
+    # Personality options, one pole chosen per pair:
+    #   ["extroverted", "introverted"]
+    #   ["agreeable", "antagonistic"]
+    #   ["conscientious", "unconscientious"]
+    #   ["neurotic", "emotionally stable"]
+    #   ["open to experience", "closed to experience"]
+    personality = [
+        "extroverted",
+        "agreeable",
+        "conscientious",
+        "emotionally stable",
+        "open to experience",
+    ]
+    persona_text = build_personality_prompt(personality)
+    system_instruction_without_context = SYSTEM_INSTRUCTION + "\n" + persona_text + "\n"
+    if not DEBUG:
+        tokenizer = AutoTokenizer.from_pretrained(RESPONSE_GENERATOR)
+        tokenizer, terminator = prepare_tokenizer(tokenizer)
+        model = AutoModelForCausalLM.from_pretrained(
+            RESPONSE_GENERATOR,
+            torch_dtype=torch.float16,
+            pad_token_id=tokenizer.eos_token_id,
+        ).to(DEVICE)
+    else:
+        # Placeholders so the UI can be built without loading a model.
+        tokenizer, terminator, model = "", "", ""
+    demo = create_demo(
+        model, tokenizer, terminator, system_instruction_without_context, stock_context_list, raw_context_list
+    )
+    demo.launch(share=True)

requirements.txt ADDED Viewed

	@@ -0,0 +1,3 @@

+transformers==4.44.1
+together==1.3.0
+markdown==3.4.1

user_feedback/interaction_3a48b93b-0de7-4e2a-b779-8f1f0c27af24_first.json ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ {"user_id": "demo_3_0_0", "uuid": "3a48b93b-0de7-4e2a-b779-8f1f0c27af24", "timestamp": "2024-10-23 17:14:02", "type": "interaction", "value": {"type": "user_elicitation", "role": "user", "content": "Hey"}}
2	+ {"user_id": "demo_3_0_0", "uuid": "3a48b93b-0de7-4e2a-b779-8f1f0c27af24", "timestamp": "2024-10-23 17:14:02", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "What brings you here today? Are you looking to start investing or reassess your current portfolio?"}}

user_feedback/interaction_462c2c52-b14f-44f1-8030-6f06d5a7d925_first.json ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ {"user_id": "demo_3_0_0", "uuid": "462c2c52-b14f-44f1-8030-6f06d5a7d925", "timestamp": "2024-10-23 17:15:17", "type": "interaction", "value": {"type": "user_elicitation", "role": "user", "content": "Hey"}}
2	+ {"user_id": "demo_3_0_0", "uuid": "462c2c52-b14f-44f1-8030-6f06d5a7d925", "timestamp": "2024-10-23 17:15:17", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "What brings you here today? Are you looking to start investing or reassess your current portfolio?"}}

user_feedback/interaction_7017b92d-6932-4d3a-b189-1267c2386995_first.json ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ {"user_id": "demo_0_0_0", "uuid": "7017b92d-6932-4d3a-b189-1267c2386995", "timestamp": "2024-10-23 17:19:10", "type": "interaction", "value": {"type": "user_elicitation", "role": "user", "content": "Hey"}}
2	+ {"user_id": "demo_0_0_0", "uuid": "7017b92d-6932-4d3a-b189-1267c2386995", "timestamp": "2024-10-23 17:19:10", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "Welcome to our financial planning session. I'm excited to help you create a personalized investment strategy. To get started, let's talk about your preferred industry for investment. Are you interested in investing in a specific sector, such as technology, healthcare, finance, energy, consumer goods, or something else?"}}

user_feedback/interaction_7e25ac2e-3849-4817-9ae3-e883bca2fb10_first.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{"user_id": "demo_3_0_0", "uuid": "7e25ac2e-3849-4817-9ae3-e883bca2fb10", "timestamp": "2024-10-23 17:05:19", "type": "interaction", "value": {"type": "user_elicitation", "role": "user", "content": "Hey"}}
+{"user_id": "demo_3_0_0", "uuid": "7e25ac2e-3849-4817-9ae3-e883bca2fb10", "timestamp": "2024-10-23 17:05:19", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "What can I help you with today? You're looking to discuss your investment options, I assume?"}}
+{"user_id": "demo_3_0_0", "uuid": "7e25ac2e-3849-4817-9ae3-e883bca2fb10", "timestamp": "2024-10-23 17:05:32", "type": "Interaction", "value": {"type": "user_elicitation", "role": "user", "content": "yes"}}
+{"user_id": "demo_3_0_0", "uuid": "7e25ac2e-3849-4817-9ae3-e883bca2fb10", "timestamp": "2024-10-23 17:05:32", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "Let's start with the basics. What type of industry or sector are you interested in investing in? Are you drawn to technology, healthcare, finance, or something else?"}}

user_feedback/interaction_8611c342-840f-4529-b9ff-d1dabb754ded_first.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{"user_id": "demo_2_2_0", "uuid": "8611c342-840f-4529-b9ff-d1dabb754ded", "timestamp": "2024-10-23 17:00:59", "type": "interaction", "value": {"type": "user_elicitation", "role": "user", "content": "Hey"}}
+{"user_id": "demo_2_2_0", "uuid": "8611c342-840f-4529-b9ff-d1dabb754ded", "timestamp": "2024-10-23 17:00:59", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "It's great to meet you! I'm thrilled to help you with your investment goals. Let's get started. To begin, I'd love to know, what industries interest you the most? Are you drawn to technology, healthcare, finance, or perhaps something else?"}}
+{"user_id": "demo_2_2_0", "uuid": "8611c342-840f-4529-b9ff-d1dabb754ded", "timestamp": "2024-10-23 17:03:47", "type": "Interaction", "value": {"type": "user_elicitation", "role": "user", "content": "I am interested in healthcare "}}
+{"user_id": "demo_2_2_0", "uuid": "8611c342-840f-4529-b9ff-d1dabb754ded", "timestamp": "2024-10-23 17:03:47", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "Healthcare is a fantastic sector with a lot of growth potential. It's also a sector that tends to be less volatile, which can be appealing to some investors. What specifically within healthcare interests you the most? Are you drawn to pharmaceuticals, medical devices, or perhaps healthcare services?"}}
+{"user_id": "demo_2_2_0", "uuid": "8611c342-840f-4529-b9ff-d1dabb754ded", "timestamp": "2024-10-23 17:04:27", "type": "interaction", "value": {"type": "Bank of America Corporation", "role": "user", "content": "Hey"}}
+{"user_id": "demo_2_2_0", "uuid": "8611c342-840f-4529-b9ff-d1dabb754ded", "timestamp": "2024-10-23 17:04:27", "type": "interaction", "value": {"type": "Bank of America Corporation", "role": "assistant", "content": "I'm so glad you're here! I've got some exciting information to share with you about a potential investment opportunity. Today, we're going to explore Bank of America Corporation, a well-established player in the financial services industry. As a customer who's interested in various sectors, I think you'll find this one fascinating.\n\nBank of America operates in four main segments: Consumer Banking, Global Wealth & Investment Management, Global Banking, and Global Markets. They offer a wide range of products and services, from banking and lending to investment and wealth management. What I think you'll appreciate is that their Consumer Banking segment focuses on serving individual consumers, which aligns with your interest in various sectors.\n\nHowever, I do want to mention that Bank of America operates in the financial services industry, which can be quite volatile. Their beta, a measure of risk, is 1.338, indicating that their stock price can be more sensitive to market fluctuations. What would you like to know more about this potential investment opportunity?"}}

user_feedback/interaction_8e1566fb-6de9-46da-a3de-c6a580fb5b83_first.json ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ {"user_id": "demo_3_0_0", "uuid": "8e1566fb-6de9-46da-a3de-c6a580fb5b83", "timestamp": "2024-10-23 17:15:46", "type": "interaction", "value": {"type": "user_elicitation", "role": "user", "content": "Hey"}}
2	+ {"user_id": "demo_3_0_0", "uuid": "8e1566fb-6de9-46da-a3de-c6a580fb5b83", "timestamp": "2024-10-23 17:15:46", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "What can I help you with today? You're looking to discuss your investment strategy, I assume?"}}

user_feedback/interaction_abfb0425-8dff-4b63-91d0-372276758a8f_first.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{"user_id": "demo_1_1_0", "uuid": "abfb0425-8dff-4b63-91d0-372276758a8f", "timestamp": "2024-10-23 17:20:21", "type": "interaction", "value": {"type": "user_elicitation", "role": "user", "content": "Hey"}}
+{"user_id": "demo_1_1_0", "uuid": "abfb0425-8dff-4b63-91d0-372276758a8f", "timestamp": "2024-10-23 17:20:21", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "Welcome to our financial planning session. I'm here to help you make informed investment decisions. To get started, let's discuss your preferred industry for investment. Are you interested in investing in a specific sector, such as technology, healthcare, finance, energy, consumer goods, or something else?"}}
+{"user_id": "demo_1_1_0", "uuid": "abfb0425-8dff-4b63-91d0-372276758a8f", "timestamp": "2024-10-23 17:20:55", "type": "interaction", "value": {"type": "Walmart Inc.", "role": "user", "content": "Hey"}}
+{"user_id": "demo_1_1_0", "uuid": "abfb0425-8dff-4b63-91d0-372276758a8f", "timestamp": "2024-10-23 17:20:55", "type": "interaction", "value": {"type": "Walmart Inc.", "role": "assistant", "content": "Welcome to our financial advisory session. I'm here to help you explore the details of a specific stock, Walmart Inc. (WMT). Before we dive in, I'd like to give you a brief overview of the company. Walmart is a multinational retail corporation that operates a wide range of stores, including supercenters, supermarkets, and e-commerce platforms. They offer a vast array of products, from groceries and electronics to clothing and home goods. They also provide various services, such as pharmacy, optical, and financial services.\n\nNow, what would you like to know more about Walmart Inc.? Would you like to explore their financial performance, business operations, or something else?"}}

user_feedback/interaction_b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea_first.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:16:41", "type": "interaction", "value": {"type": "user_elicitation", "role": "user", "content": "Hey"}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:16:41", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "What can I help you with today? We're going to discuss your investment preferences. Let's start with the industry. Are you interested in investing in a specific sector, such as technology, healthcare, finance, or something else?"}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:16:55", "type": "Interaction", "value": {"type": "user_elicitation", "role": "user", "content": "I am interested in healthcare"}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:16:55", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "Healthcare is a stable industry with a strong demand for services. What aspect of healthcare are you most interested in? Pharmaceuticals, medical devices, hospitals, or perhaps biotechnology?"}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:17:06", "type": "Interaction", "value": {"type": "user_elicitation", "role": "user", "content": "I do not have preference on that"}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:17:06", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "So you're open to various sub-sectors within healthcare. That's a broad and diverse field. Next, let's discuss the type of stocks you're interested in. Are you looking for value stocks, which are often undervalued and have the potential for long-term growth, or growth stocks, which are expected to experience rapid expansion?"}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:17:28", "type": "Interaction", "value": {"type": "user_elicitation", "role": "user", "content": "What are the differences?"}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:17:28", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "Value stocks are typically undervalued by the market, meaning their price is lower than their intrinsic value. They often have a history of stable earnings and a strong financial foundation. Growth stocks, on the other hand, are expected to experience rapid expansion in revenue and earnings, but may be more volatile. They often have a higher growth potential, but also come with higher risks. Think of it like buying a house: value stocks are like a stable, established home, while growth stocks are like a new, rapidly expanding development."}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:17:36", "type": "Interaction", "value": {"type": "user_elicitation", "role": "user", "content": "I like growth stock"}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:17:36", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "Growth stocks can be more exciting, but also come with higher risks. They often require a higher tolerance for volatility. Next, let's discuss dividends. Are you interested in investing in stocks that pay dividends, providing a regular income stream, or non-dividend stocks, which focus on capital appreciation?"}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:17:47", "type": "Interaction", "value": {"type": "user_elicitation", "role": "user", "content": "Any recommendations for that"}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:17:47", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "I'm not here to recommend specific stocks yet. This conversation is about your preferences. We'll discuss specific stocks in the next session. For now, I just need to understand your preference. Do you want dividend-paying stocks for regular income or non-dividend stocks for potential long-term growth?"}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:18:00", "type": "Interaction", "value": {"type": "user_elicitation", "role": "user", "content": "I want dividend stock"}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:18:00", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "Dividend stocks can provide a steady income stream. However, keep in mind that they often come with lower growth potential compared to non-dividend stocks. Next, let's discuss the type of stocks that are less affected by economic downturns. Are you interested in cyclical stocks, which are closely tied to the overall economy and can be more volatile, or non-cyclical stocks, which are less affected by economic fluctuations?"}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:18:09", "type": "Interaction", "value": {"type": "user_elicitation", "role": "user", "content": "Probably non-cyclical one"}}
+{"user_id": "demo_3_0_0", "uuid": "b8b1504f-a952-4c9c-b6b1-febdb3ffd6ea", "timestamp": "2024-10-23 17:18:09", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "Non-cyclical stocks tend to be more stable and less affected by economic downturns. They often provide a steady income stream and can be a good fit for investors seeking lower volatility. I think we've covered the main points. Thank you for the conversation, please move on to the next section."}}

user_feedback/interaction_d34ca619-e30a-4267-9538-cc8f99aff079.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{"user_id": "demo_3_2_4", "uuid": "d34ca619-e30a-4267-9538-cc8f99aff079", "timestamp": "2024-10-23 12:02:59", "type": "interaction", "value": {"type": "user_elicitation", "role": "user", "content": "Hey"}}
+{"user_id": "demo_3_2_4", "uuid": "d34ca619-e30a-4267-9538-cc8f99aff079", "timestamp": "2024-10-23 12:02:59", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "Welcome to our financial planning session. I'm here to help you understand your investment preferences. Let's start with the first topic: preferred industries. Are you interested in investing in a specific industry, such as technology, healthcare, finance, or something else?"}}
+{"user_id": "demo_3_2_4", "uuid": "d34ca619-e30a-4267-9538-cc8f99aff079", "timestamp": "2024-10-23 12:03:07", "type": "interaction", "value": {"type": "Apple Inc.", "role": "user", "content": "Hey"}}
+{"user_id": "demo_3_2_4", "uuid": "d34ca619-e30a-4267-9538-cc8f99aff079", "timestamp": "2024-10-23 12:03:07", "type": "interaction", "value": {"type": "Apple Inc.", "role": "assistant", "content": "Apple Inc. is a technology company that designs and manufactures a wide range of products, including iPhones, Mac computers, and wearables. They also offer various services, such as Apple Music and Apple Pay. Given your profile, I notice that you don't have any specific industry preferences, which makes Apple a good fit in that regard. However, as a technology company, Apple is considered a growth stock, and its beta is 1.239, indicating a relatively high level of volatility. This might be a concern for some investors. What would you like to know more about Apple's performance and prospects?"}}

user_feedback/interaction_e7f30c05-4668-4b35-a706-ba27b7c0a0a9_first.json ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ {"user_id": "demo_2_2_0", "uuid": "e7f30c05-4668-4b35-a706-ba27b7c0a0a9", "timestamp": "2024-10-23 17:13:16", "type": "interaction", "value": {"type": "user_elicitation", "role": "user", "content": "Hey"}}
2	+ {"user_id": "demo_2_2_0", "uuid": "e7f30c05-4668-4b35-a706-ba27b7c0a0a9", "timestamp": "2024-10-23 17:13:16", "type": "Interaction", "value": {"type": "user_elicitation", "role": "assistant", "content": "It's great to meet you! I'm excited to help you with your investment goals. Let's get started. What kind of industry or sector are you most interested in investing in? Are you drawn to technology, healthcare, finance, or something else?"}}

user_feedback/summarization_8611c342-840f-4529-b9ff-d1dabb754ded_first.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"user_id": "demo_2_2_0", "uuid": "8611c342-840f-4529-b9ff-d1dabb754ded", "timestamp": "2024-10-23 17:04:25", "type": "preference_elicitation_summarization", "value": {"summarization": "Based on the previous conversation, here's a summary of the customer's investment preferences:\n\n1. **Preferred Industries:** Healthcare\n2. **Value vs. Growth Stocks:** Not discussed\n3. **Dividend vs. Non-Dividend Stocks:** Not discussed\n4. **Cyclical vs. Non-Cyclical Stocks:** Not discussed"}}

user_feedback/summarization_d34ca619-e30a-4267-9538-cc8f99aff079.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"user_id": "demo_3_2_4", "uuid": "d34ca619-e30a-4267-9538-cc8f99aff079", "timestamp": "2024-10-23 12:03:05", "type": "preference_elicitation_summarization", "value": {"summarization": "Unfortunately, I don't have any information about a previous conversation with a customer. However, I can provide a summary based on the given conversation snippet.\n\nPreferred Industries: The customer has not expressed a preference for a specific industry.\n\nValue vs. Growth Stocks: Not discussed.\n\nDividend vs. Non-Dividend Stocks: Not discussed.\n\nCyclical vs. Non-Cyclical Stocks: Not discussed."}}