ehristoforu committed on
Commit
e5bc143
1 Parent(s): 9f8439e

Update webui.py

Browse files
Files changed (1) hide show
  1. webui.py +2 -3
webui.py CHANGED
@@ -5,7 +5,6 @@ import time
5
  if echo == "True":
6
  from modules.echo import *
7
 
8
- import spaces
9
 
10
  import os
11
  import gradio as gr
@@ -60,7 +59,7 @@ with gr.Blocks(theme=theme, title=f"TensorLM v{tlm_version} Demo", css="style.cs
60
  with gr.Row(render=False) as settings:
61
  reload_model = gr.Button("Apply settings to model", interactive=True)
62
  n_ctx = gr.Slider(label="Number of CTX", minimum=1024, maximum=4056, value=2048, step=8, interactive=True)
63
- n_gpu_layers = gr.Slider(label="Number of GPU layers", minimum=0, maximum=36, value=4, step=1, interactive=True)
64
  n_threads = gr.Slider(label="Number of Threads", minimum=2, maximum=36, value=8, step=1, interactive=True)
65
  verbose = gr.Checkbox(label="Verbose", value=True, interactive=True)
66
  f16_kv = gr.Checkbox(label="F16 KV", value=True, interactive=True)
@@ -70,7 +69,7 @@ with gr.Blocks(theme=theme, title=f"TensorLM v{tlm_version} Demo", css="style.cs
70
  use_mlock = gr.Checkbox(label="Use mlock", value=False, interactive=True)
71
  n_batch = gr.Slider(label="Number of batch", minimum=128, maximum=2048, value=512, step=8, interactive=True)
72
  last_n_tokens_size = gr.Slider(label="Last number of tokens size", minimum=8, maximum=512, value=64, step=8, interactive=True)
73
- low_vram = gr.Checkbox(label="Low VRAM", value=lowvram_arg, interactive=True)
74
  rope_freq_base = gr.Slider(label="Rope freq base", minimum=1000.0, maximum=30000.0, value=10000.0, step=0.1, interactive=True)
75
  rope_freq_scale = gr.Slider(label="Rope freq scale", minimum=0.1, maximum=3.0, value=1.0, step=0.1)
76
 
 
5
  if echo == "True":
6
  from modules.echo import *
7
 
 
8
 
9
  import os
10
  import gradio as gr
 
59
  with gr.Row(render=False) as settings:
60
  reload_model = gr.Button("Apply settings to model", interactive=True)
61
  n_ctx = gr.Slider(label="Number of CTX", minimum=1024, maximum=4056, value=2048, step=8, interactive=True)
62
+ n_gpu_layers = gr.Slider(label="Number of GPU layers", minimum=0, maximum=36, value=0, step=1, interactive=False)
63
  n_threads = gr.Slider(label="Number of Threads", minimum=2, maximum=36, value=8, step=1, interactive=True)
64
  verbose = gr.Checkbox(label="Verbose", value=True, interactive=True)
65
  f16_kv = gr.Checkbox(label="F16 KV", value=True, interactive=True)
 
69
  use_mlock = gr.Checkbox(label="Use mlock", value=False, interactive=True)
70
  n_batch = gr.Slider(label="Number of batch", minimum=128, maximum=2048, value=512, step=8, interactive=True)
71
  last_n_tokens_size = gr.Slider(label="Last number of tokens size", minimum=8, maximum=512, value=64, step=8, interactive=True)
72
+ low_vram = gr.Checkbox(label="Low VRAM", value=lowvram_arg, interactive=False)
73
  rope_freq_base = gr.Slider(label="Rope freq base", minimum=1000.0, maximum=30000.0, value=10000.0, step=0.1, interactive=True)
74
  rope_freq_scale = gr.Slider(label="Rope freq scale", minimum=0.1, maximum=3.0, value=1.0, step=0.1)
75