Namitg02 committed on
Commit
f125e9c
·
verified ·
1 Parent(s): 49627b2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +13 -0
app.py CHANGED
@@ -11,6 +11,19 @@ from transformers import AutoTokenizer
11
  from transformers import AutoModelForCausalLM
12
  from transformers import TextIteratorStreamer
13
  from threading import Thread
 
 
 
 
 
 
 
 
 
 
 
 
 
14
 
15
  llm_model = "TinyLlama/TinyLlama-1.1B-Chat-v1.0"
16
  tokenizer = AutoTokenizer.from_pretrained(llm_model)
 
11
  from transformers import AutoModelForCausalLM
12
  from transformers import TextIteratorStreamer
13
  from threading import Thread
14
+ from torchtext.data import to_map_style_dataset
15
+
16
+ llm_model = "TinyLlama/TinyLlama-1.1B-Chat-v1.0"
17
+ tokenizer = AutoTokenizer.from_pretrained(llm_model)
18
+ # pulling tokenizer for text generation model
19
+
20
+ #import numpy as np
21
+
22
+ datasetiter = load_dataset("Namitg02/Test", split='train', streaming=False)
23
+ #dataset = np.array(list(datasetiter))
24
+
25
+ #dataset = np.dataset(np.array(list(datasetiter)))
26
+ dataset = to_map_style_dataset(datasetiter)
27
 
28
  llm_model = "TinyLlama/TinyLlama-1.1B-Chat-v1.0"
29
  tokenizer = AutoTokenizer.from_pretrained(llm_model)