Spaces:
Build error
Build error
Update webui.py
Browse files
webui.py
CHANGED
|
@@ -5,7 +5,6 @@ import time
|
|
| 5 |
if echo == "True":
|
| 6 |
from modules.echo import *
|
| 7 |
|
| 8 |
-
import spaces
|
| 9 |
|
| 10 |
import os
|
| 11 |
import gradio as gr
|
|
@@ -60,7 +59,7 @@ with gr.Blocks(theme=theme, title=f"TensorLM v{tlm_version} Demo", css="style.cs
|
|
| 60 |
with gr.Row(render=False) as settings:
|
| 61 |
reload_model = gr.Button("Apply settings to model", interactive=True)
|
| 62 |
n_ctx = gr.Slider(label="Number of CTX", minimum=1024, maximum=4056, value=2048, step=8, interactive=True)
|
| 63 |
-
n_gpu_layers = gr.Slider(label="Number of GPU layers", minimum=0, maximum=36, value=
|
| 64 |
n_threads = gr.Slider(label="Number of Threads", minimum=2, maximum=36, value=8, step=1, interactive=True)
|
| 65 |
verbose = gr.Checkbox(label="Verbose", value=True, interactive=True)
|
| 66 |
f16_kv = gr.Checkbox(label="F16 KV", value=True, interactive=True)
|
|
@@ -70,7 +69,7 @@ with gr.Blocks(theme=theme, title=f"TensorLM v{tlm_version} Demo", css="style.cs
|
|
| 70 |
use_mlock = gr.Checkbox(label="Use mlock", value=False, interactive=True)
|
| 71 |
n_batch = gr.Slider(label="Number of batch", minimum=128, maximum=2048, value=512, step=8, interactive=True)
|
| 72 |
last_n_tokens_size = gr.Slider(label="Last number of tokens size", minimum=8, maximum=512, value=64, step=8, interactive=True)
|
| 73 |
-
low_vram = gr.Checkbox(label="Low VRAM", value=lowvram_arg, interactive=True)
|
| 74 |
rope_freq_base = gr.Slider(label="Rope freq base", minimum=1000.0, maximum=30000.0, value=10000.0, step=0.1, interactive=True)
|
| 75 |
rope_freq_scale = gr.Slider(label="Rope freq scale", minimum=0.1, maximum=3.0, value=1.0, step=0.1)
|
| 76 |
|
|
|
|
| 5 |
if echo == "True":
|
| 6 |
from modules.echo import *
|
| 7 |
|
|
|
|
| 8 |
|
| 9 |
import os
|
| 10 |
import gradio as gr
|
|
|
|
| 59 |
with gr.Row(render=False) as settings:
|
| 60 |
reload_model = gr.Button("Apply settings to model", interactive=True)
|
| 61 |
n_ctx = gr.Slider(label="Number of CTX", minimum=1024, maximum=4056, value=2048, step=8, interactive=True)
|
| 62 |
+
n_gpu_layers = gr.Slider(label="Number of GPU layers", minimum=0, maximum=36, value=0, step=1, interactive=False)
|
| 63 |
n_threads = gr.Slider(label="Number of Threads", minimum=2, maximum=36, value=8, step=1, interactive=True)
|
| 64 |
verbose = gr.Checkbox(label="Verbose", value=True, interactive=True)
|
| 65 |
f16_kv = gr.Checkbox(label="F16 KV", value=True, interactive=True)
|
|
|
|
| 69 |
use_mlock = gr.Checkbox(label="Use mlock", value=False, interactive=True)
|
| 70 |
n_batch = gr.Slider(label="Number of batch", minimum=128, maximum=2048, value=512, step=8, interactive=True)
|
| 71 |
last_n_tokens_size = gr.Slider(label="Last number of tokens size", minimum=8, maximum=512, value=64, step=8, interactive=True)
|
| 72 |
+
low_vram = gr.Checkbox(label="Low VRAM", value=lowvram_arg, interactive=False)
|
| 73 |
rope_freq_base = gr.Slider(label="Rope freq base", minimum=1000.0, maximum=30000.0, value=10000.0, step=0.1, interactive=True)
|
| 74 |
rope_freq_scale = gr.Slider(label="Rope freq scale", minimum=0.1, maximum=3.0, value=1.0, step=0.1)
|
| 75 |
|