Spaces:

hydraadra112
/

SciDocuParse

Sleeping

App Files Files Community

hydraadra112 committed on Apr 10

Commit

55c4810

0 Parent(s):

Created streamlit platform for SciDocuParse

Browse files

Files changed (7) hide show

.gitattributes +37 -0
.gitignore +174 -0
README.md +14 -0
SciDocuParse.py +60 -0
playground.ipynb +159 -0
requirements.txt +4 -0
utils.py +64 -0

.gitattributes ADDED Viewed

	@@ -0,0 +1,37 @@

+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+assets/logoJPG.jpg filter=lfs diff=lfs merge=lfs -text
+assets/logo_trans.png filter=lfs diff=lfs merge=lfs -text

.gitignore ADDED Viewed

	@@ -0,0 +1,174 @@

+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+# C extensions
+*.so
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+share/python-wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+# PyInstaller
+#  Usually these files are written by a python script from a template
+#  before PyInstaller builds the exe, so as to inject date/other infos into it.
+*.manifest
+*.spec
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.nox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+*.py,cover
+.hypothesis/
+.pytest_cache/
+cover/
+# Translations
+*.mo
+*.pot
+# Django stuff:
+*.log
+local_settings.py
+db.sqlite3
+db.sqlite3-journal
+# Flask stuff:
+instance/
+.webassets-cache
+# Scrapy stuff:
+.scrapy
+# Sphinx documentation
+docs/_build/
+# PyBuilder
+.pybuilder/
+target/
+# Jupyter Notebook
+.ipynb_checkpoints
+# IPython
+profile_default/
+ipython_config.py
+# pyenv
+#   For a library or package, you might want to ignore these files since the code is
+#   intended to run in multiple environments; otherwise, check them in:
+# .python-version
+# pipenv
+#   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
+#   However, in case of collaboration, if having platform-specific dependencies or dependencies
+#   having no cross-platform support, pipenv may install dependencies that don't work, or not
+#   install all needed dependencies.
+#Pipfile.lock
+# UV
+#   Similar to Pipfile.lock, it is generally recommended to include uv.lock in version control.
+#   This is especially recommended for binary packages to ensure reproducibility, and is more
+#   commonly ignored for libraries.
+#uv.lock
+# poetry
+#   Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
+#   This is especially recommended for binary packages to ensure reproducibility, and is more
+#   commonly ignored for libraries.
+#   https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
+#poetry.lock
+# pdm
+#   Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
+#pdm.lock
+#   pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
+#   in version control.
+#   https://pdm.fming.dev/latest/usage/project/#working-with-version-control
+.pdm.toml
+.pdm-python
+.pdm-build/
+# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
+__pypackages__/
+# Celery stuff
+celerybeat-schedule
+celerybeat.pid
+# SageMath parsed files
+*.sage.py
+# Environments
+.env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+# Spyder project settings
+.spyderproject
+.spyproject
+# Rope project settings
+.ropeproject
+# mkdocs documentation
+/site
+# mypy
+.mypy_cache/
+.dmypy.json
+dmypy.json
+# Pyre type checker
+.pyre/
+# pytype static type analyzer
+.pytype/
+# Cython debug symbols
+cython_debug/
+# PyCharm
+#  JetBrains specific template is maintained in a separate JetBrains.gitignore that can
+#  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
+#  and can be added to the global gitignore or merged into this file.  For a more nuclear
+#  option (not recommended) you can uncomment the following to ignore the entire idea folder.
+#.idea/
+# Ruff stuff:
+.ruff_cache/
+# PyPI configuration file
+.pypirc

README.md ADDED Viewed

	@@ -0,0 +1,14 @@

+---
+title: SciDocuParse
+emoji: 🏆
+colorFrom: yellow
+colorTo: yellow
+sdk: streamlit
+sdk_version: 1.43.2
+app_file: SciDocuParse.py
+pinned: false
+license: mit
+short_description: A scientific document graph interpreter & analyzer
+---
+Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

SciDocuParse.py ADDED Viewed

	@@ -0,0 +1,60 @@

+import streamlit as st
+from utils import get_api_key, get_response
+def main():
+    st.header('Welcome to SciDocuParse! 🧑‍🔬📚')
+    st.write('A scientific document parser, particularly specializing in graph analysis 📊 and data interpretation 🔍.')
+    st.session_state["thought_process"] = ""
+    st.session_state["response"] = ""
+    with st.sidebar:
+        st.header('SciDocuParse Sidebar 🔧')
+        st.caption('A tool to help you analyze scientific papers and documents efficiently! 📝')
+        paper = st.text_area('Paste scientific document citation here 🧑‍🏫',
+                                        """@article{wang2020automated,
+        title={Automated diabetic retinopathy grading and lesion detection based on the modified R-FCN object-detection algorithm},
+        author={Wang, Jialiang and Luo, Jianxu and Liu, Bin and Feng, Rui and Lu, Lina and Zou, Haidong},
+        journal={IET Computer Vision},
+        volume={14},
+        number={1},
+        pages={1--8},
+        year={2020},
+        publisher={Wiley Online Library}
+        }""", height=350, help='Paste your document citation in BiBtex format.')
+        if not paper:
+            st.error('Provide a citation first! ⚠️')
+        user_prompt = st.text_area("Enter your query for analysis 🔍:",
+                                    "Summarize this document and highlight key findings in graphs 📈")
+        persona = "You are a master Scientific Graph Analyzer skilled in interpreting graphs across all fields. Analyze trends (linear/exponential growth, correlations, outliers) and statistical patterns (mean, variance). Summarize key findings in plain language, Expalin data about causality, anomalies, or data limitations. Prioritize clarity: ensure outputs are accessible to technical and non-technical audiences. Combine technical precision with intuitive communication to deliver accurate, user-friendly interpretations."
+        user_prompt = persona + paper + user_prompt
+        # api_key = get_api_key()
+        if st.button('Analyze with LLM 🚀'):
+            with st.spinner('Processing your document...'):
+                api_key = get_api_key()
+                thought_process, response = get_response(user_prompt, api_key) # uncommenting it to save tokens
+                st.session_state["thought_process"] = thought_process
+                st.session_state["response"] = response
+    if "thought_process" in st.session_state and "response" in st.session_state:
+        if len(st.session_state["thought_process"]) >= 1 and len(st.session_state["response"]) >= 1:
+            with st.expander('Show thought process 💭'):
+                st.caption(thought_process)
+            st.subheader('RESPONSE 📝')
+            st.write(response)
+    st.caption('SciDocuParse is made by John Manuel Carado')
+    st.caption('Intelligent Systems course in WVSU - CICT, Midterm Requirement')
+if __name__ == '__main__':
+    main()

playground.ipynb ADDED Viewed

	@@ -0,0 +1,159 @@

+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import os\n",
+    "import re\n",
+    "from dotenv import load_dotenv\n",
+    "from typing import Tuple\n",
+    "from groq import Groq"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "load_dotenv()\n",
+    "api_key = os.getenv('key')\n",
+    "\n",
+    "prompt = 'How to get your first paper published?'"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "client = Groq(api_key=api_key)\n",
+    "completion = client.chat.completions.create(\n",
+    "    model=\"deepseek-r1-distill-llama-70b\",\n",
+    "    messages=[\n",
+    "        {\n",
+    "            'role': 'user',\n",
+    "            'content': prompt\n",
+    "        }\n",
+    "        ],\n",
+    "    temperature=0.6,\n",
+    "    max_completion_tokens=4096,\n",
+    "    top_p=0.95,\n",
+    "    stream=True,\n",
+    "    stop=None,\n",
+    ")\n",
+    "\n",
+    "chunks = []\n",
+    "for chunk in completion:\n",
+    "    current_chunk = chunk.choices[0].delta.content or \"\"\n",
+    "    chunks.append(current_chunk)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "full_response = \"\".join(chunks)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "\"<think>\\nOkay, so I want to get my first paper published, but I'm not really sure where to start. I've heard that publishing research is a big deal in academia, but the process seems pretty intimidating. Let me try to break this down step by step.\\n\\nFirst, I think I need to have some research done. I remember my professor mentioning that I should start by identifying a gap in the literature. But wait, how do I even find that gap? I guess I need to read a lot of papers in my field. Maybe I can start by looking at some recent studies and see where there's something missing or where more research is needed. But I'm not exactly sure how to efficiently find these gaps. Do I just read everything and hope I spot something? That seems time-consuming.\\n\\nOnce I have an idea, I need to design a study. I'm a bit confused about the methodology part. Should I go for an experimental approach or maybe a review? I think it depends on what I'm researching. If I'm testing a hypothesis, an experiment makes sense, but if I'm synthesizing existing information, a review might be better. But I'm not sure which one is more likely to get accepted, especially as a first-time author.\\n\\nAfter designing the study, I need to conduct the research. This part might take a while. I'm worried about collecting enough data and ensuring it's reliable. What if my results aren't significant? Does that mean my paper won't get published? I guess even negative results can be valuable, but I'm not certain how journals view them.\\n\\nNext, I need to write the paper. I'm a bit overwhelmed by the structure: title, abstract, introduction, methods, results, discussion, conclusion, references. Each section has its own requirements. The abstract is supposed to summarize everything, but I'm not sure how to make it concise yet. The introduction needs to set up the problem, but I'm not confident in my ability to clearly state the research gap. 
I've heard that the discussion section is where I interpret the results, but I'm worried about overstepping and making unsupported claims.\\n\\nChoosing the right journal is another hurdle. There are so many journals out there, and each has different scopes and impact factors. How do I pick one that's a good fit? I don't want to aim too high and get rejected, but I also don't want to aim too low. Maybe I should look at where similar studies have been published. But how do I assess the impact factor? Is it just about the number, or are there other factors?\\n\\nOnce the paper is written, I need to format it according to the journal's guidelines. This includes things like citation style, font, margins, etc. I'm a bit nervous about missing some formatting detail and having the paper rejected because of that. Maybe I should double-check the guidelines multiple times or use a template.\\n\\nThen comes the submission process. I think most journals use online systems, so I'll need to create an account and upload my manuscript. I'm a bit confused about what to include besides the manuscript—like a cover letter. What should I write in the cover letter? Do I just state the title and that it's original work, or is there more to it?\\n\\nAfter submission, the waiting game begins. I've heard that peer review can take months, which is a long time. What happens if the reviewers reject my paper? I guess I can revise and resubmit, but I'm not sure how to handle negative feedback. It might be discouraging, especially if I'm really invested in the work.\\n\\nIf it gets accepted, I'll have to deal with the production process—proofreading, layouts, etc. I'm not sure how involved that is. Do I need to check every single detail, or is it handled by the journal? I hope they catch any mistakes, but I know I should still review it carefully.\\n\\nPromotion is something I hadn't thought about. After publication, I should probably share it on social media and maybe my institution's platform. 
But I'm not very active on these platforms, so I'm not sure how effective that will be. Maybe I should set up a few profiles just for this purpose.\\n\\nEthical considerations are important too. I need to make sure I didn't plagiarize anything, even accidentally. Using proper citations is crucial, but I'm sometimes unsure if I'm citing correctly. Also, if I used any data that's sensitive, I need to anonymize it properly. I should probably run my paper through a plagiarism checker before submission.\\n\\nStaying persistent is the last step. I know publishing can involve multiple rejections, but I'm not sure how to handle that mentally. It might be tough to keep going after a rejection, but I guess every successful researcher has been through that.\\n\\nOverall, I think the key steps are: identify a research gap, design the study, conduct the research, write the paper, choose the right journal, format correctly, submit, handle peer review, and then promote the work. But each step has its own challenges, and I'm not entirely confident in my ability to navigate them all. Maybe I should seek guidance from my professor or a mentor to help me through the process. They might have tips or can review my work before I submit it. I should also start early and give myself plenty of time, especially since peer review can take a while. It's a lot to take in, but breaking it down into manageable steps makes it feel more achievable.\\n</think>\\n\\nPublishing your first research paper is a significant academic milestone. Here's a structured approach to guide you through the process, addressing each step with clarity and confidence:\\n\\n### 1. Identify a Research Gap\\n- **Literature Review:** Begin by reading recent studies in your field. Use academic databases like PubMed, Google Scholar, or Web of Science to find relevant papers.\\n- **Spotting Gaps:** Look for areas where the current research is lacking or inconclusive. 
This could be a understudied population, a novel application of a method, or unanswered questions.\\n\\n### 2. Design Your Study\\n- **Methodology:** Choose between experimental, observational, or review studies based on your research question. Experimental designs test hypotheses, while reviews synthesize existing data.\\n- **Feasibility:** Ensure your study is feasible with available resources and time.\\n\\n### 3. Conduct the Research\\n- **Data Collection:** Collect data meticulously, ensuring reliability. Consider using pilot studies to test your methods.\\n- **Ethical Considerations:** Obtain necessary approvals (e.g., IRB) and ensure confidentiality and informed consent.\\n\\n### 4. Write the Paper\\n- **Structure:** Organize your paper into sections: Title, Abstract, Introduction, Methods, Results, Discussion, Conclusion, References.\\n  - **Abstract:** Summarize your study succinctly, highlighting objectives, methods, results, and conclusions.\\n  - **Introduction:** Clearly state the research gap and objectives.\\n  - **Discussion:** Interpret results, relate them to existing literature, and discuss implications.\\n\\n### 5. Choose the Right Journal\\n- **Journal Selection:** Consider journals where similar studies have been published. Check the scope, impact factor, and audience.\\n- **Target Appropriately:** Balance between high-impact and realistic targets. Consider open-access options for broader reach.\\n\\n### 6. Format and Submit\\n- **Formatting:** Adhere strictly to the journal’s guidelines, including citation style (e.g., APA, MLA).\\n- **Cover Letter:** Briefly introduce your manuscript, state its originality, and mention any conflicts of interest.\\n\\n### 7. Peer Review Process\\n- **Submission:** Use the journal’s online system. Be prepared for a wait, as peer review can take months.\\n- **Revisions:** If revisions are requested, address them thoroughly. Use feedback to improve your manuscript.\\n\\n### 8. 
Post-Acceptance\\n- **Production:** Review proofs carefully for errors. Ensure all figures and tables are correctly placed.\\n- **Promotion:** Share your paper on social media, academic platforms, and through your institution. Consider creating profiles for this purpose.\\n\\n### 9. Ethical and Legal Considerations\\n- **Plagiarism:** Use plagiarism checkers like Turnitin. Ensure all citations are correctly formatted.\\n- **Data Protection:** Anonymize sensitive data and obtain necessary consents.\\n\\n### 10. Persistence and Learning\\n- **Handle Rejections:** View rejections as part of the process. Use feedback to improve future submissions.\\n- **Stay Persistent:** Keep submitting and learning from each experience.\\n\\n### Additional Tips\\n- **Seek Mentorship:** Consult with professors or mentors for guidance and reviews.\\n- **Start Early:** Allow ample time for each step, especially peer review.\\n- **Collaborate:** Work with colleagues or peers to gain different perspectives and support.\\n\\nBy following these steps and maintaining persistence, you can successfully navigate the publication process and contribute valuable research to your field.\""
+      ]
+     },
+     "execution_count": 9,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "full_response"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "thought_process_match = re.search(r\"<think>\\s*(.*?)\\s*</think>\", full_response, re.DOTALL)\n",
+    "thought_process = thought_process_match.group(1) if thought_process_match else \"\"\n",
+    "\n",
+    "actual_response = re.sub(r\"<think>.*?</think>\\s*\", \"\", full_response, flags=re.DOTALL)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "\"Okay, so I want to get my first paper published, but I'm not really sure where to start. I've heard that publishing research is a big deal in academia, but the process seems pretty intimidating. Let me try to break this down step by step.\\n\\nFirst, I think I need to have some research done. I remember my professor mentioning that I should start by identifying a gap in the literature. But wait, how do I even find that gap? I guess I need to read a lot of papers in my field. Maybe I can start by looking at some recent studies and see where there's something missing or where more research is needed. But I'm not exactly sure how to efficiently find these gaps. Do I just read everything and hope I spot something? That seems time-consuming.\\n\\nOnce I have an idea, I need to design a study. I'm a bit confused about the methodology part. Should I go for an experimental approach or maybe a review? I think it depends on what I'm researching. If I'm testing a hypothesis, an experiment makes sense, but if I'm synthesizing existing information, a review might be better. But I'm not sure which one is more likely to get accepted, especially as a first-time author.\\n\\nAfter designing the study, I need to conduct the research. This part might take a while. I'm worried about collecting enough data and ensuring it's reliable. What if my results aren't significant? Does that mean my paper won't get published? I guess even negative results can be valuable, but I'm not certain how journals view them.\\n\\nNext, I need to write the paper. I'm a bit overwhelmed by the structure: title, abstract, introduction, methods, results, discussion, conclusion, references. Each section has its own requirements. The abstract is supposed to summarize everything, but I'm not sure how to make it concise yet. The introduction needs to set up the problem, but I'm not confident in my ability to clearly state the research gap. 
I've heard that the discussion section is where I interpret the results, but I'm worried about overstepping and making unsupported claims.\\n\\nChoosing the right journal is another hurdle. There are so many journals out there, and each has different scopes and impact factors. How do I pick one that's a good fit? I don't want to aim too high and get rejected, but I also don't want to aim too low. Maybe I should look at where similar studies have been published. But how do I assess the impact factor? Is it just about the number, or are there other factors?\\n\\nOnce the paper is written, I need to format it according to the journal's guidelines. This includes things like citation style, font, margins, etc. I'm a bit nervous about missing some formatting detail and having the paper rejected because of that. Maybe I should double-check the guidelines multiple times or use a template.\\n\\nThen comes the submission process. I think most journals use online systems, so I'll need to create an account and upload my manuscript. I'm a bit confused about what to include besides the manuscript—like a cover letter. What should I write in the cover letter? Do I just state the title and that it's original work, or is there more to it?\\n\\nAfter submission, the waiting game begins. I've heard that peer review can take months, which is a long time. What happens if the reviewers reject my paper? I guess I can revise and resubmit, but I'm not sure how to handle negative feedback. It might be discouraging, especially if I'm really invested in the work.\\n\\nIf it gets accepted, I'll have to deal with the production process—proofreading, layouts, etc. I'm not sure how involved that is. Do I need to check every single detail, or is it handled by the journal? I hope they catch any mistakes, but I know I should still review it carefully.\\n\\nPromotion is something I hadn't thought about. After publication, I should probably share it on social media and maybe my institution's platform. 
But I'm not very active on these platforms, so I'm not sure how effective that will be. Maybe I should set up a few profiles just for this purpose.\\n\\nEthical considerations are important too. I need to make sure I didn't plagiarize anything, even accidentally. Using proper citations is crucial, but I'm sometimes unsure if I'm citing correctly. Also, if I used any data that's sensitive, I need to anonymize it properly. I should probably run my paper through a plagiarism checker before submission.\\n\\nStaying persistent is the last step. I know publishing can involve multiple rejections, but I'm not sure how to handle that mentally. It might be tough to keep going after a rejection, but I guess every successful researcher has been through that.\\n\\nOverall, I think the key steps are: identify a research gap, design the study, conduct the research, write the paper, choose the right journal, format correctly, submit, handle peer review, and then promote the work. But each step has its own challenges, and I'm not entirely confident in my ability to navigate them all. Maybe I should seek guidance from my professor or a mentor to help me through the process. They might have tips or can review my work before I submit it. I should also start early and give myself plenty of time, especially since peer review can take a while. It's a lot to take in, but breaking it down into manageable steps makes it feel more achievable.\""
+      ]
+     },
+     "execution_count": 12,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "thought_process"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "\"Publishing your first research paper is a significant academic milestone. Here's a structured approach to guide you through the process, addressing each step with clarity and confidence:\\n\\n### 1. Identify a Research Gap\\n- **Literature Review:** Begin by reading recent studies in your field. Use academic databases like PubMed, Google Scholar, or Web of Science to find relevant papers.\\n- **Spotting Gaps:** Look for areas where the current research is lacking or inconclusive. This could be a understudied population, a novel application of a method, or unanswered questions.\\n\\n### 2. Design Your Study\\n- **Methodology:** Choose between experimental, observational, or review studies based on your research question. Experimental designs test hypotheses, while reviews synthesize existing data.\\n- **Feasibility:** Ensure your study is feasible with available resources and time.\\n\\n### 3. Conduct the Research\\n- **Data Collection:** Collect data meticulously, ensuring reliability. Consider using pilot studies to test your methods.\\n- **Ethical Considerations:** Obtain necessary approvals (e.g., IRB) and ensure confidentiality and informed consent.\\n\\n### 4. Write the Paper\\n- **Structure:** Organize your paper into sections: Title, Abstract, Introduction, Methods, Results, Discussion, Conclusion, References.\\n  - **Abstract:** Summarize your study succinctly, highlighting objectives, methods, results, and conclusions.\\n  - **Introduction:** Clearly state the research gap and objectives.\\n  - **Discussion:** Interpret results, relate them to existing literature, and discuss implications.\\n\\n### 5. Choose the Right Journal\\n- **Journal Selection:** Consider journals where similar studies have been published. Check the scope, impact factor, and audience.\\n- **Target Appropriately:** Balance between high-impact and realistic targets. Consider open-access options for broader reach.\\n\\n### 6. 
Format and Submit\\n- **Formatting:** Adhere strictly to the journal’s guidelines, including citation style (e.g., APA, MLA).\\n- **Cover Letter:** Briefly introduce your manuscript, state its originality, and mention any conflicts of interest.\\n\\n### 7. Peer Review Process\\n- **Submission:** Use the journal’s online system. Be prepared for a wait, as peer review can take months.\\n- **Revisions:** If revisions are requested, address them thoroughly. Use feedback to improve your manuscript.\\n\\n### 8. Post-Acceptance\\n- **Production:** Review proofs carefully for errors. Ensure all figures and tables are correctly placed.\\n- **Promotion:** Share your paper on social media, academic platforms, and through your institution. Consider creating profiles for this purpose.\\n\\n### 9. Ethical and Legal Considerations\\n- **Plagiarism:** Use plagiarism checkers like Turnitin. Ensure all citations are correctly formatted.\\n- **Data Protection:** Anonymize sensitive data and obtain necessary consents.\\n\\n### 10. Persistence and Learning\\n- **Handle Rejections:** View rejections as part of the process. Use feedback to improve future submissions.\\n- **Stay Persistent:** Keep submitting and learning from each experience.\\n\\n### Additional Tips\\n- **Seek Mentorship:** Consult with professors or mentors for guidance and reviews.\\n- **Start Early:** Allow ample time for each step, especially peer review.\\n- **Collaborate:** Work with colleagues or peers to gain different perspectives and support.\\n\\nBy following these steps and maintaining persistence, you can successfully navigate the publication process and contribute valuable research to your field.\""
+      ]
+     },
+     "execution_count": 11,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "actual_response"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": ".venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.1"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}

requirements.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+streamlit==1.42.0
+python-dotenv==1.0.1
+groq==0.20.0
+pymupdf==1.25.4

utils.py ADDED Viewed

	@@ -0,0 +1,64 @@

+import os
+import re
+from dotenv import load_dotenv
+from typing import Tuple
+from groq import Groq
+def get_api_key() -> str:
+    """
+    Get the api key to the LLM
+    Returns:
+        str: The api key to be used to reach the LLM
+    """
+    load_dotenv()
+    api_key = os.getenv('key')
+    return api_key
+def get_response(prompt: str, api_key) -> Tuple[str, str]:
+    """
+    Gets the response of the LLM on the provided prompt.
+    Args:
+        prompt (str): The prompt to be plugged in
+    Returns:
+        tuple:
+            str: Includes the thinking part of the LLM, showing its thought process.
+            str: The actual answer to your prompt
+    """
+    client = Groq(api_key=api_key)
+    completion = client.chat.completions.create(
+        model="deepseek-r1-distill-llama-70b",
+        messages=[
+            {
+                'role': 'user',
+                'content': prompt
+            }
+            ],
+        temperature=0.6,
+        max_completion_tokens=4096,
+        top_p=0.95,
+        stream=True,
+        stop=None,
+    )
+    chunks = []
+    for chunk in completion:
+        current_chunk = chunk.choices[0].delta.content or ""
+        chunks.append(current_chunk)
+    full_response = "".join(chunks)
+    # Splitting the text
+    thought_process_match = re.search(r"<think>\s*(.*?)\s*</think>", full_response, re.DOTALL)
+    thought_process = thought_process_match.group(1) if thought_process_match else ""
+    actual_response = re.sub(r"<think>.*?</think>\s*", "", full_response, flags=re.DOTALL)
+    return thought_process, actual_response