Spaces:
Sleeping
Sleeping
ehristoforu
committed on
Commit
•
e5bc143
1
Parent(s):
9f8439e
Update webui.py
Browse files
webui.py
CHANGED
@@ -5,7 +5,6 @@ import time
|
|
5 |
if echo == "True":
|
6 |
from modules.echo import *
|
7 |
|
8 |
-
import spaces
|
9 |
|
10 |
import os
|
11 |
import gradio as gr
|
@@ -60,7 +59,7 @@ with gr.Blocks(theme=theme, title=f"TensorLM v{tlm_version} Demo", css="style.cs
|
|
60 |
with gr.Row(render=False) as settings:
|
61 |
reload_model = gr.Button("Apply settings to model", interactive=True)
|
62 |
n_ctx = gr.Slider(label="Number of CTX", minimum=1024, maximum=4056, value=2048, step=8, interactive=True)
|
63 |
-
n_gpu_layers = gr.Slider(label="Number of GPU layers", minimum=0, maximum=36, value=
|
64 |
n_threads = gr.Slider(label="Number of Threads", minimum=2, maximum=36, value=8, step=1, interactive=True)
|
65 |
verbose = gr.Checkbox(label="Verbose", value=True, interactive=True)
|
66 |
f16_kv = gr.Checkbox(label="F16 KV", value=True, interactive=True)
|
@@ -70,7 +69,7 @@ with gr.Blocks(theme=theme, title=f"TensorLM v{tlm_version} Demo", css="style.cs
|
|
70 |
use_mlock = gr.Checkbox(label="Use mlock", value=False, interactive=True)
|
71 |
n_batch = gr.Slider(label="Number of batch", minimum=128, maximum=2048, value=512, step=8, interactive=True)
|
72 |
last_n_tokens_size = gr.Slider(label="Last number of tokens size", minimum=8, maximum=512, value=64, step=8, interactive=True)
|
73 |
-
low_vram = gr.Checkbox(label="Low VRAM", value=lowvram_arg, interactive=
|
74 |
rope_freq_base = gr.Slider(label="Rope freq base", minimum=1000.0, maximum=30000.0, value=10000.0, step=0.1, interactive=True)
|
75 |
rope_freq_scale = gr.Slider(label="Rope freq scale", minimum=0.1, maximum=3.0, value=1.0, step=0.1)
|
76 |
|
|
|
5 |
if echo == "True":
|
6 |
from modules.echo import *
|
7 |
|
|
|
8 |
|
9 |
import os
|
10 |
import gradio as gr
|
|
|
59 |
with gr.Row(render=False) as settings:
|
60 |
reload_model = gr.Button("Apply settings to model", interactive=True)
|
61 |
n_ctx = gr.Slider(label="Number of CTX", minimum=1024, maximum=4056, value=2048, step=8, interactive=True)
|
62 |
+
n_gpu_layers = gr.Slider(label="Number of GPU layers", minimum=0, maximum=36, value=0, step=1, interactive=False)
|
63 |
n_threads = gr.Slider(label="Number of Threads", minimum=2, maximum=36, value=8, step=1, interactive=True)
|
64 |
verbose = gr.Checkbox(label="Verbose", value=True, interactive=True)
|
65 |
f16_kv = gr.Checkbox(label="F16 KV", value=True, interactive=True)
|
|
|
69 |
use_mlock = gr.Checkbox(label="Use mlock", value=False, interactive=True)
|
70 |
n_batch = gr.Slider(label="Number of batch", minimum=128, maximum=2048, value=512, step=8, interactive=True)
|
71 |
last_n_tokens_size = gr.Slider(label="Last number of tokens size", minimum=8, maximum=512, value=64, step=8, interactive=True)
|
72 |
+
low_vram = gr.Checkbox(label="Low VRAM", value=lowvram_arg, interactive=False)
|
73 |
rope_freq_base = gr.Slider(label="Rope freq base", minimum=1000.0, maximum=30000.0, value=10000.0, step=0.1, interactive=True)
|
74 |
rope_freq_scale = gr.Slider(label="Rope freq scale", minimum=0.1, maximum=3.0, value=1.0, step=0.1)
|
75 |
|