Update app.py
Browse files
app.py
CHANGED
@@ -29,14 +29,17 @@ def upload_visibility(radio):
|
|
29 |
else:
|
30 |
return gr.UploadButton(visible=bool(0))
|
31 |
|
32 |
-
|
|
|
|
|
|
|
|
|
33 |
|
34 |
-
if dataset_predefined.visible:
|
35 |
-
print('')
|
36 |
-
else:
|
37 |
-
print('')
|
38 |
-
return 0
|
39 |
|
|
|
|
|
|
|
|
|
40 |
|
41 |
|
42 |
|
@@ -80,7 +83,7 @@ def main():
|
|
80 |
##### Title Block #####
|
81 |
gr.Markdown("# Instruction Tuning with Unsloth")
|
82 |
|
83 |
-
##### Model Inputs #####
|
84 |
gr.Markdown("### Model Inputs")
|
85 |
|
86 |
# Select Model
|
@@ -98,18 +101,31 @@ def main():
|
|
98 |
dataset_predefined = gr.Textbox(label="Hugging Face Hub Dataset",
|
99 |
value='yahma/alpaca-cleaned',
|
100 |
visible=True)
|
101 |
-
|
|
|
102 |
file_types=[".csv",".jsonl", ".txt"],
|
103 |
visible=False)
|
104 |
data_field = gr.Textbox(label="Dataset Training Field",
|
105 |
value=conf['model']['general']["dataset_text_field"])
|
|
|
106 |
dataset_choice.change(textbox_visibility,
|
107 |
dataset_choice,
|
108 |
dataset_predefined)
|
109 |
dataset_choice.change(upload_visibility,
|
110 |
dataset_choice,
|
111 |
dataset_upload)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
112 |
|
|
|
113 |
gr.Markdown("### Model Parameter Selection")
|
114 |
# Parameters
|
115 |
max_seq_length = gr.Textbox(label="Maximum sequence length",
|
@@ -138,7 +154,7 @@ def main():
|
|
138 |
|
139 |
##### Execution #####
|
140 |
|
141 |
-
# Setup
|
142 |
tune_btn = gr.Button("Start Fine Tuning")
|
143 |
gr.Markdown("### Model Progress")
|
144 |
# Text output (for now)
|
@@ -148,7 +164,7 @@ def main():
|
|
148 |
# Data retrieval
|
149 |
|
150 |
|
151 |
-
# Execute
|
152 |
tune_btn.click(fn=train,
|
153 |
inputs=[model_name,
|
154 |
inject_prompt,
|
|
|
29 |
else:
|
30 |
return gr.UploadButton(visible=bool(0))
|
31 |
|
32 |
+
#from datasets import load_dataset
|
33 |
+
|
34 |
+
def get_predefined_dataset(dataset_name):
    """Load the ``train`` split of a Hugging Face Hub dataset.

    Args:
        dataset_name: Hub dataset identifier handed straight to
            ``load_dataset`` (the UI defaults to ``'yahma/alpaca-cleaned'``).

    Returns:
        Whatever ``load_dataset(dataset_name, split="train")`` returns.
    """
    # Imported locally: the only visible module-level import of
    # ``load_dataset`` is commented out, which would leave the name undefined
    # when this callback fires.
    from datasets import load_dataset

    return load_dataset(dataset_name, split="train")
|
37 |
|
|
|
|
|
|
|
|
|
|
|
38 |
|
39 |
+
def get_uploaded_dataset(file=None, max_chars=100):
    """Return the first characters of an uploaded dataset file as a preview.

    Args:
        file: The uploaded file, either a filesystem path or an object that
            exposes the path as ``.name`` (e.g. a temporary-file wrapper).
            ``None`` means nothing has been uploaded yet.
        max_chars: Maximum number of characters to return.

    Returns:
        Up to ``max_chars`` characters from the start of the file, or an
        empty string when ``file`` is ``None``.
    """
    if file is None:
        return ""

    # Accept both a plain path and a file-like wrapper carrying ``.name``.
    path = getattr(file, "name", file)

    # Read only the preview instead of loading the entire dataset; undecodable
    # bytes are replaced so a preview never fails on a stray byte.
    with open(path, "r", encoding="utf-8", errors="replace") as f:
        return f.read(max_chars)
|
43 |
|
44 |
|
45 |
|
|
|
83 |
##### Title Block #####
|
84 |
gr.Markdown("# Instruction Tuning with Unsloth")
|
85 |
|
86 |
+
##### Initial Model Inputs #####
|
87 |
gr.Markdown("### Model Inputs")
|
88 |
|
89 |
# Select Model
|
|
|
101 |
dataset_predefined = gr.Textbox(label="Hugging Face Hub Dataset",
|
102 |
value='yahma/alpaca-cleaned',
|
103 |
visible=True)
|
104 |
+
dataset_predefined_load = gr.Button("Upload Dataset")
|
105 |
+
dataset_uploaded_load = gr.UploadButton(label="Upload Dataset (csv, jsonl, or txt)",
|
106 |
file_types=[".csv",".jsonl", ".txt"],
|
107 |
visible=False)
|
108 |
data_field = gr.Textbox(label="Dataset Training Field",
|
109 |
value=conf['model']['general']["dataset_text_field"])
|
110 |
+
data_snippet = gr.Markdown()
|
111 |
dataset_choice.change(textbox_visibility,
|
112 |
dataset_choice,
|
113 |
dataset_predefined)
|
114 |
# Toggle the upload button with the dataset-source choice. The component is
# named ``dataset_uploaded_load``; the former name ``dataset_upload`` is no
# longer defined.
dataset_choice.change(upload_visibility,
                      dataset_choice,
                      dataset_uploaded_load)
|
117 |
+
|
118 |
+
# Dataset button
|
119 |
+
# Load the Hub dataset named in the ``dataset_predefined`` textbox; the
# button itself carries no dataset name, so it must not be the input.
dataset_predefined_load.click(fn=get_predefined_dataset,
                              inputs=dataset_predefined,
                              outputs=data_snippet)
|
122 |
+
|
123 |
+
# Preview the file once it has actually been uploaded; ``click`` fires when
# the button is pressed, before any file is available.
dataset_uploaded_load.upload(fn=get_uploaded_dataset,
                             inputs=dataset_uploaded_load,
                             outputs=data_snippet)
|
126 |
+
|
127 |
|
128 |
+
##### Model Parameter Inputs #####
|
129 |
gr.Markdown("### Model Parameter Selection")
|
130 |
# Parameters
|
131 |
max_seq_length = gr.Textbox(label="Maximum sequence length",
|
|
|
154 |
|
155 |
##### Execution #####
|
156 |
|
157 |
+
# Setup buttons
|
158 |
tune_btn = gr.Button("Start Fine Tuning")
|
159 |
gr.Markdown("### Model Progress")
|
160 |
# Text output (for now)
|
|
|
164 |
# Data retrieval
|
165 |
|
166 |
|
167 |
+
# Execute buttons
|
168 |
tune_btn.click(fn=train,
|
169 |
inputs=[model_name,
|
170 |
inject_prompt,
|