Spaces:

Ono-Enzo
/

test-space

Build error

App Files Files Community

Ono-Enzo committed on Jun 25, 2024

Commit

770d2f5

verified ·

1 Parent(s): 2e2eee1

Upload 8 files

Browse files

Files changed (4) hide show

.gitignore +1 -1
README.md +23 -3
app.py +6 -0
utils.py +2 -0

.gitignore CHANGED Viewed

@@ -157,4 +157,4 @@ cython_debug/
 #  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
 #  and can be added to the global gitignore or merged into this file.  For a more nuclear
 #  option (not recommended) you can uncomment the following to ignore the entire idea folder.
-#.idea/

 #  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
 #  and can be added to the global gitignore or merged into this file.  For a more nuclear
 #  option (not recommended) you can uncomment the following to ignore the entire idea folder.
+#.idea/

README.md CHANGED Viewed

@@ -1,10 +1,11 @@
 title: QASports Website - Basketball
 emoji: 👁
 colorFrom: purple
 colorTo: green
 sdk: streamlit
 sdk_version: 1.33.0
-python_version: 3.1
 suggested_hardware: t4-small
 app_file: app.py
 pinned: false
@@ -14,8 +15,27 @@ tags:
   - question-answering
   - open-domain-qa
   - extractive-qa
-short_description: QASports the first large sports-themed QA dataset
 models:
   - deepset/roberta-base-squad2
 datasets:
-  - PedroCJardim/QASports

+---
 title: QASports Website - Basketball
 emoji: 👁
 colorFrom: purple
 colorTo: green
 sdk: streamlit
 sdk_version: 1.33.0
+python_version: 3.10
 suggested_hardware: t4-small
 app_file: app.py
 pinned: false
   - question-answering
   - open-domain-qa
   - extractive-qa
+short_description: "QASports the first large sports-themed QA dataset"
 models:
   - deepset/roberta-base-squad2
 datasets:
+  - PedroCJardim/QASports
+---
+Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
+# Website
+This website presents a collection of documents from the dataset named "QASports", the first large sports question answering dataset for open questions. QASports contains real data about players, teams and matches from three sports: soccer, basketball and American football.
+- 💻 Website: https://huggingface.co/spaces/leomaurodesenv/qasports-website
+- 🔧 Scripts: https://github.com/leomaurodesenv/qasports-dataset-website
+> **Note**. As a first version, we are focusing only on Basketball data.
+## Dataset Summary
+QASports is the first large sports-themed question answering dataset, with over 1.5 million questions and answers about 54k preprocessed wiki pages. Its documents come from the wikis of 3 of the most popular sports in the world: Soccer, American Football and Basketball. Each sport can be downloaded individually as a subset, with the train, test and validation splits, or all 3 can be downloaded together.
+- 🎲 Dataset: https://huggingface.co/datasets/PedroCJardim/QASports
+- 🔧 Scripts: https://github.com/leomaurodesenv/qasports-dataset-scripts/

app.py CHANGED Viewed

@@ -13,6 +13,7 @@ from utils import get_unique_docs
 def load_documents():
     """
     Load the documents from the dataset considering only unique documents.
     Returns:
     - documents: list of dictionaries with the documents.
     """
@@ -33,6 +34,7 @@ def load_documents():
 def get_document_store(documents):
     """
     Index the files in the document store.
     Args:
     - files: list of dictionaries with the documents.
     """
@@ -47,8 +49,10 @@ def get_document_store(documents):
 def get_question_pipeline(_doc_store):
     """
     Create the pipeline with the retriever and reader components.
     Args:
     - doc_store: instance of the document store.
     Returns:
     - pipe: instance of the pipeline.
     """
@@ -68,9 +72,11 @@ def get_question_pipeline(_doc_store):
 def search(pipeline, question: str):
     """
     Search for the answer to a question in the documents.
     Args:
     - pipeline: instance of the pipeline.
     - question: string with the question.
     Returns:
     - answer: dictionary with the answer.
     """

 def load_documents():
     """
     Load the documents from the dataset considering only unique documents.
     Returns:
     - documents: list of dictionaries with the documents.
     """
 def get_document_store(documents):
     """
     Index the files in the document store.
     Args:
     - files: list of dictionaries with the documents.
     """
 def get_question_pipeline(_doc_store):
     """
     Create the pipeline with the retriever and reader components.
     Args:
     - doc_store: instance of the document store.
     Returns:
     - pipe: instance of the pipeline.
     """
 def search(pipeline, question: str):
     """
     Search for the answer to a question in the documents.
     Args:
     - pipeline: instance of the pipeline.
     - question: string with the question.
     Returns:
     - answer: dictionary with the answer.
     """

utils.py CHANGED Viewed

@@ -6,8 +6,10 @@ from haystack import Document
 def get_unique_docs(dataset, unique_docs: set):
     """Get unique documents from dataset
     Args:
     dataset: list of dictionaries
     Returns:
     docs: list of haystack.Document
     """

 def get_unique_docs(dataset, unique_docs: set):
     """Get unique documents from dataset
     Args:
     dataset: list of dictionaries
     Returns:
     docs: list of haystack.Document
     """