Namitg02 committed on
Commit
117bfa6
·
verified ·
1 Parent(s): 49f4c57

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -9
app.py CHANGED
@@ -25,15 +25,6 @@ dataset = load_dataset("Namitg02/Test", split='train', streaming=False)
25
  #Returns a list of dictionaries, each representing a row in the dataset.
26
  print(dataset[1])
27
  length = len(dataset)
28
- df = pd.DataFrame(dataset)
29
-
30
- embeddings = embedding_model.encode(dataset["text"])
31
- print(embeddings)
32
-
33
- df['embeddings'] = embeddings
34
- dataset = Dataset.from_pandas(df)
35
- print(dataset[1])
36
-
37
 
38
  #Itemdetails = dataset.items()
39
  #print(Itemdetails)
@@ -42,6 +33,16 @@ embedding_model = SentenceTransformer("mixedbread-ai/mxbai-embed-large-v1")
42
  #embedding_model = HuggingFaceEmbeddings(model_name = "mixedbread-ai/mxbai-embed-large-v1")
43
  #all-MiniLM-L6-v2, BAAI/bge-base-en-v1.5,infgrad/stella-base-en-v2, BAAI/bge-large-en-v1.5 working with default dimensions
44
 
 
 
 
 
 
 
 
 
 
 
45
  #doc_func = lambda x: x.text
46
  #dataset = list(map(doc_func, dataset))
47
 
 
25
  #Returns a list of dictionaries, each representing a row in the dataset.
26
  print(dataset[1])
27
  length = len(dataset)
 
 
 
 
 
 
 
 
 
28
 
29
  #Itemdetails = dataset.items()
30
  #print(Itemdetails)
 
33
  #embedding_model = HuggingFaceEmbeddings(model_name = "mixedbread-ai/mxbai-embed-large-v1")
34
  #all-MiniLM-L6-v2, BAAI/bge-base-en-v1.5,infgrad/stella-base-en-v2, BAAI/bge-large-en-v1.5 working with default dimensions
35
 
36
+ df = pd.DataFrame(dataset)
37
+ display(df)
38
+ embeddings = embedding_model.encode(dataset["text"])
39
+ print(embeddings)
40
+ df['embeddings'] = embeddings
41
+ display(df)
42
+ dataset = Dataset.from_pandas(df)
43
+ print(dataset[1])
44
+ print(dataset[2])
45
+
46
  #doc_func = lambda x: x.text
47
  #dataset = list(map(doc_func, dataset))
48