tykiww committed on
Commit
ab084df
·
verified ·
1 Parent(s): 2f1a468

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +26 -10
app.py CHANGED
@@ -29,14 +29,17 @@ def upload_visibility(radio):
29
  else:
30
  return gr.UploadButton(visible=bool(0))
31
 
32
- def get_dataset(dataset_predefined, dataset_upload, data_field):
 
 
 
 
33
 
34
- if dataset_predefined.visible:
35
- print('')
36
- else:
37
- print('')
38
- return 0
39
 
 
 
 
 
40
 
41
 
42
 
@@ -80,7 +83,7 @@ def main():
80
  ##### Title Block #####
81
  gr.Markdown("# Instruction Tuning with Unsloth")
82
 
83
- ##### Model Inputs #####
84
  gr.Markdown("### Model Inputs")
85
 
86
  # Select Model
@@ -98,18 +101,31 @@ def main():
98
  dataset_predefined = gr.Textbox(label="Hugging Face Hub Dataset",
99
  value='yahma/alpaca-cleaned',
100
  visible=True)
101
- dataset_upload = gr.UploadButton(label="Upload Dataset (csv, jsonl, or txt)",
 
102
  file_types=[".csv",".jsonl", ".txt"],
103
  visible=False)
104
  data_field = gr.Textbox(label="Dataset Training Field",
105
  value=conf['model']['general']["dataset_text_field"])
 
106
  dataset_choice.change(textbox_visibility,
107
  dataset_choice,
108
  dataset_predefined)
109
  dataset_choice.change(upload_visibility,
110
  dataset_choice,
111
  dataset_upload)
 
 
 
 
 
 
 
 
 
 
112
 
 
113
  gr.Markdown("### Model Parameter Selection")
114
  # Parameters
115
  max_seq_length = gr.Textbox(label="Maximum sequence length",
@@ -138,7 +154,7 @@ def main():
138
 
139
  ##### Execution #####
140
 
141
- # Setup button
142
  tune_btn = gr.Button("Start Fine Tuning")
143
  gr.Markdown("### Model Progress")
144
  # Text output (for now)
@@ -148,7 +164,7 @@ def main():
148
  # Data retrieval
149
 
150
 
151
- # Execute button
152
  tune_btn.click(fn=train,
153
  inputs=[model_name,
154
  inject_prompt,
 
29
  else:
30
  return gr.UploadButton(visible=bool(0))
31
 
32
+ #from datasets import load_dataset
33
+
34
def get_predefined_dataset(dataset_name):
    """Load the "train" split of the dataset identified by *dataset_name*.

    The name is forwarded unchanged to ``load_dataset`` and the object it
    returns is handed back as-is.
    """
    # NOTE(review): ``load_dataset`` must be in scope at module level; the
    # nearby import is commented out in this view -- confirm it exists.
    return load_dataset(dataset_name, split="train")
37
 
 
 
 
 
 
38
 
39
def get_uploaded_dataset(file=None):
    """Return a short preview of an uploaded dataset file.

    Args:
        file: The upload to preview. Either a filesystem path, or an object
            exposing the path through a ``name`` attribute. ``None`` (the
            default) means nothing has been uploaded yet.
            NOTE(review): assumes the upload component passes one of these
            two shapes -- confirm against the installed Gradio version.

    Returns:
        The first 100 characters of the file, or an empty string when no
        file was supplied.
    """
    if file is None:
        return ""

    # Accept both a plain path and a file-like wrapper carrying ``.name``.
    path = getattr(file, "name", file)

    # Only the preview is needed, so read 100 characters instead of the whole
    # file; undecodable bytes are replaced rather than aborting the preview.
    with open(path, "r", encoding="utf-8", errors="replace") as f:
        return f.read(100)
43
 
44
 
45
 
 
83
  ##### Title Block #####
84
  gr.Markdown("# Instruction Tuning with Unsloth")
85
 
86
+ ##### Initial Model Inputs #####
87
  gr.Markdown("### Model Inputs")
88
 
89
  # Select Model
 
101
  dataset_predefined = gr.Textbox(label="Hugging Face Hub Dataset",
102
  value='yahma/alpaca-cleaned',
103
  visible=True)
104
+ dataset_predefined_load = gr.Button("Upload Dataset")
105
+ dataset_uploaded_load = gr.UploadButton(label="Upload Dataset (csv, jsonl, or txt)",
106
  file_types=[".csv",".jsonl", ".txt"],
107
  visible=False)
108
  data_field = gr.Textbox(label="Dataset Training Field",
109
  value=conf['model']['general']["dataset_text_field"])
110
+ data_snippet = gr.Markdown()
111
  dataset_choice.change(textbox_visibility,
112
  dataset_choice,
113
  dataset_predefined)
114
  dataset_choice.change(upload_visibility,
115
  dataset_choice,
116
  dataset_upload)
117
+
118
+ # Dataset button
119
+ dataset_predefined_load.click(fn=get_predefined_dataset
120
+ inputs=dataset_predefined_load,
121
+ outputs=data_snippet)
122
+
123
+ dataset_uploaded_load.click(fn=get_uploaded_dataset,
124
+ inputs=dataset_uploaded_load,
125
+ outputs=data_snippet)
126
+
127
 
128
+ ##### Model Parameter Inputs #####
129
  gr.Markdown("### Model Parameter Selection")
130
  # Parameters
131
  max_seq_length = gr.Textbox(label="Maximum sequence length",
 
154
 
155
  ##### Execution #####
156
 
157
+ # Setup buttons
158
  tune_btn = gr.Button("Start Fine Tuning")
159
  gr.Markdown("### Model Progress")
160
  # Text output (for now)
 
164
  # Data retrieval
165
 
166
 
167
+ # Execute buttons
168
  tune_btn.click(fn=train,
169
  inputs=[model_name,
170
  inject_prompt,