|
|
|
import os |
|
from g4f import ChatCompletion |
|
from google.colab import userdata |
|
from pinecone import Pinecone |
|
import pandas as pd |
|
from datasets import Dataset |
|
from sentence_transformers import SentenceTransformer |
|
import gradio as gr |
|
|
|
# Identifier of the embedding model. It is only defined in this part of the
# file; presumably it is passed to SentenceTransformer later -- TODO confirm.
model_name = "BAAI/bge-m3"

# Pinecone region, defined once and reused for the environment variable below.
PINECONE_ENVIRONMENT = "us-east-1"

# The API key is read from Colab's secret storage. It must never be written
# into the notebook source as a literal.
# SECURITY: an earlier revision of this file contained a hard-coded key; that
# key should be treated as leaked and revoked/rotated in the Pinecone console.
PINECONE_API_KEY = userdata.get("PINECONE_API_KEY")

# Keep exporting both settings so any code that reads them from the process
# environment continues to work.
os.environ["PINECONE_ENVIRONMENT"] = PINECONE_ENVIRONMENT
os.environ["PINECONE_API_KEY"] = PINECONE_API_KEY

# Shared Pinecone client for the rest of the notebook.
pc = Pinecone(api_key=PINECONE_API_KEY)
|
|
|
|
|
# CSV file that backs the notebook's dataset.
file_path = '/content/dataset.csv'

# Load the CSV into a pandas DataFrame and wrap it in a `datasets.Dataset`.
# Loading is best-effort: on any failure DATASET is set to None and the error
# is printed, so the remaining cells can still run and check for None.
try:
    df = pd.read_csv(file_path)
    DATASET = Dataset.from_pandas(df)
except Exception as e:
    DATASET = None
    print(f"Error loading dataset: {e}")
else:
    # Success reporting lives outside the try body so that a problem while
    # printing is not misreported as a load failure and does not discard an
    # already-loaded dataset.
    print(f"Dataset '{file_path}' loaded successfully.\n")
    print(DATASET)
|
|
|
|
|
def print_dataset_info() -> None:
    """Print the module-level ``DATASET``, or a notice when none is loaded.

    "Not loaded" means ``DATASET is None``. An identity check is used instead
    of truthiness so that a loaded object that happens to be falsy (for
    example one whose length is zero) is still reported as the current
    dataset.
    """
    if DATASET is None:
        print("No dataset loaded.")
    else:
        print(f"Current dataset: {DATASET}")
|
|
|
|
|
# Notebook-export form of a `%%capture` cell whose body is `%store DATASET`:
# runs the IPython `%store` magic on DATASET with the cell output captured.
get_ipython().run_cell_magic(
    'capture',
    '',
    '%store DATASET',
)
|
|