CannaTech committed
Commit 03435e9 · 1 Parent(s): 5382d52

Update app.py

Files changed (1)
  1. app.py +3 -169
app.py CHANGED
@@ -1,181 +1,15 @@
-# Import the necessary libraries
-from __future__ import annotations
 import os
 import openai
 import gradio as gr
 import csv
 import json
-import io
-import uuid
-import datetime
-from abc import ABC, abstractmethod
-from pathlib import Path
-from typing import TYPE_CHECKING, Any, List
-from gradio.documentation import document, set_documentation_group
-from gradio.components import IOComponent
-
 
 # Set the OpenAI API key
 openai.api_key = os.getenv("OPENAI_API_KEY")
 
-##################
-
-class FlaggingCallback(ABC):
-    """
-    An abstract class for defining the methods that any FlaggingCallback should have.
-    """
-
-    @abstractmethod
-    def setup(self, components: List[IOComponent], flagging_dir: str):
-        """
-        This method should be overridden and ensure that everything is set up correctly for flag().
-        This method gets called once at the beginning of the Interface.launch() method.
-        Parameters:
-            components: Set of components that will provide flagged data.
-            flagging_dir: A string, typically containing the path to the directory where the flagging file should be stored (provided as an argument to Interface.__init__()).
-        """
-        pass
-
-    @abstractmethod
-    def flag(
-        self,
-        flag_data: List[Any],
-        flag_option: str | None = None,
-        flag_index: int | None = None,
-        username: str | None = None,
-    ) -> int:
-        """
-        This method should be overridden by the FlaggingCallback subclass and may contain optional additional arguments.
-        This gets called every time the <flag> button is pressed.
-        Parameters:
-            interface: The Interface object that is being used to launch the flagging interface.
-            flag_data: The data to be flagged.
-            flag_option (optional): In the case that flagging_options are provided, the flag option that is being used.
-            flag_index (optional): The index of the sample that is being flagged.
-            username (optional): The username of the user that is flagging the data, if logged in.
-        Returns:
-            (int) The total number of samples that have been flagged.
-        """
-        pass
-
-
-class HuggingFaceDatasetSaver(FlaggingCallback):
-    """
-    A callback that saves each flagged sample (both the input and output data)
-    to a HuggingFace dataset.
-    Example:
-        import gradio as gr
-        hf_writer = gr.HuggingFaceDatasetSaver(HF_API_TOKEN, "image-classification-mistakes")
-        def image_classifier(inp):
-            return {'cat': 0.3, 'dog': 0.7}
-        demo = gr.Interface(fn=image_classifier, inputs="image", outputs="label",
-                            allow_flagging="manual", flagging_callback=hf_writer)
-    Guides: using_flagging
-    """
-
-    def __init__(
-        self,
-        hf_token: str,
-        dataset_name: str,
-        organization: str | None = None,
-        private: bool = False,
-    ):
-        """
-        Parameters:
-            hf_token: The HuggingFace token to use to create (and write the flagged sample to) the HuggingFace dataset.
-            dataset_name: The name of the dataset to save the data to, e.g. "image-classifier-1"
-            organization: The organization to save the dataset under. The hf_token must provide write access to this organization. If not provided, saved under the name of the user corresponding to the hf_token.
-            private: Whether the dataset should be private (defaults to False).
-        """
-        self.hf_token = hf_token
-        self.dataset_name = dataset_name
-        self.organization_name = organization
-        self.dataset_private = private
-
-    def setup(self, components: List[IOComponent], flagging_dir: str):
-        """
-        Params:
-            flagging_dir (str): local directory where the dataset is cloned,
-            updated, and pushed from.
-        """
-        try:
-            import huggingface_hub
-        except (ImportError, ModuleNotFoundError):
-            raise ImportError(
-                "Package `huggingface_hub` not found is needed "
-                "for HuggingFaceDatasetSaver. Try 'pip install huggingface_hub'."
-            )
-        path_to_dataset_repo = huggingface_hub.create_repo(
-            name=self.dataset_name,
-            token=self.hf_token,
-            private=self.dataset_private,
-            repo_type="dataset",
-            exist_ok=True,
-        )
-        self.path_to_dataset_repo = path_to_dataset_repo  # e.g. "https://huggingface.co/datasets/abidlabs/test-audio-10"
-        self.components = components
-        self.flagging_dir = flagging_dir
-        self.dataset_dir = Path(flagging_dir) / self.dataset_name
-        self.repo = huggingface_hub.Repository(
-            local_dir=str(self.dataset_dir),
-            clone_from=path_to_dataset_repo,
-            use_auth_token=self.hf_token,
-        )
-        self.repo.git_pull(lfs=True)
-
-        # Should filename be user-specified?
-        self.log_file = Path(self.dataset_dir) / "data.csv"
-        self.infos_file = Path(self.dataset_dir) / "dataset_infos.json"
-
-    def flag(
-        self,
-        flag_data: List[Any],
-        flag_option: str | None = None,
-        flag_index: int | None = None,
-        username: str | None = None,
-    ) -> int:
-        self.repo.git_pull(lfs=True)
-
-        is_new = not Path(self.log_file).exists()
-
-        with open(self.log_file, "a", newline="", encoding="utf-8") as csvfile:
-            writer = csv.writer(csvfile)
-
-            # File previews for certain input and output types
-            infos, file_preview_types, headers = _get_dataset_features_info(
-                is_new, self.components
-            )
-
-            # Generate the headers and dataset_infos
-            if is_new:
-                writer.writerow(utils.sanitize_list_for_csv(headers))
-
-            # Generate the row corresponding to the flagged sample
-            csv_data = []
-            for component, sample in zip(self.components, flag_data):
-                save_dir = Path(
-                    self.dataset_dir
-                ) / utils.strip_invalid_filename_characters(component.label or "")
-                filepath = component.deserialize(sample, save_dir, None)
-                csv_data.append(filepath)
-                if isinstance(component, tuple(file_preview_types)):
-                    csv_data.append(
-                        "{}/resolve/main/{}".format(self.path_to_dataset_repo, filepath)
-                    )
-            csv_data.append(flag_option if flag_option is not None else "")
-            writer.writerow(utils.sanitize_list_for_csv(csv_data))
-
-        if is_new:
-            json.dump(infos, open(self.infos_file, "w"))
-
-        with open(self.log_file, "r", encoding="utf-8") as csvfile:
-            line_count = len([None for row in csv.reader(csvfile)]) - 1
-
-        self.repo.push_to_hub(commit_message="Flagged sample #{}".format(line_count))
-
-        return line_count
-
-##################
+# Set up flagging callback function
+HF_TOKEN = os.getenv("HF_TOKEN")
+hf_writer = gr.HuggingFaceDatasetSaver(HF_TOKEN, "CannaTech/Flagged")
 
 # Set up flagging callback function
 HF_TOKEN = os.getenv("HF_TOKEN")
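After this commit the app no longer vendors Gradio's FlaggingCallback and HuggingFaceDatasetSaver classes; it relies on the gr.HuggingFaceDatasetSaver that ships with Gradio. The sketch below shows how such a saver is typically wired into an Interface. Only the HF_TOKEN lookup, the "CannaTech/Flagged" dataset name, and the OpenAI key setup come from the diff above; the chat function, its text inputs/outputs, and the model name are illustrative assumptions, not taken from this Space's app.py.

import os
import openai
import gradio as gr

# Set the OpenAI API key (as in the diff above)
openai.api_key = os.getenv("OPENAI_API_KEY")

# Flagged samples are pushed to the "CannaTech/Flagged" dataset repo (as in the diff above)
HF_TOKEN = os.getenv("HF_TOKEN")
hf_writer = gr.HuggingFaceDatasetSaver(HF_TOKEN, "CannaTech/Flagged")

def chat(prompt):
    # Hypothetical prediction function; the real app.py may differ.
    response = openai.ChatCompletion.create(
        model="gpt-3.5-turbo",
        messages=[{"role": "user", "content": prompt}],
    )
    return response["choices"][0]["message"]["content"]

demo = gr.Interface(
    fn=chat,
    inputs="text",
    outputs="text",
    allow_flagging="manual",      # shows a Flag button in the UI
    flagging_callback=hf_writer,  # each flag is appended to the dataset repo
)

if __name__ == "__main__":
    demo.launch()

With this wiring, pressing the Flag button saves the flagged input/output pair to the Hugging Face dataset repo, which is exactly the behavior the removed in-file classes used to provide.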