Spaces:

seanpedrickcase
/

Light-PDF-Web-QA-Chatbot

Running

Sean-Case committed on Oct 16, 2023

Commit

8249fd3

•

1 Parent(s): 994ad90

Made GPU layer bar invisible. Changed default GPU layers when CUDA available

Files changed (2) hide show

app.py CHANGED Viewed

@@ -80,9 +80,11 @@ def load_model(model_type, gpu_layers, gpu_config=None, cpu_config=None, torch_d
         torch_device = chatf.torch_device
     if model_type == "Mistral Open Orca (larger, slow)":
-        gpu_config.update_gpu(gpu_layers)
-        cpu_config.update_gpu(gpu_layers)
         print("Loading with", cpu_config.gpu_layers, "model layers sent to GPU.")
@@ -231,7 +233,7 @@ with block:
     with gr.Tab("Advanced features"):
         model_choice = gr.Radio(label="Choose a chat model", value="Flan Alpaca (small, fast)", choices = ["Flan Alpaca (small, fast)", "Mistral Open Orca (larger, slow)"])
         with gr.Row():
-            gpu_layer_choice = gr.Slider(label="Choose number of model layers to send to GPU (WARNING: please don't modify unless you have a GPU).", value=0, minimum=0, maximum=5, step = 1, visible=True)
             change_model_button = gr.Button(value="Load model", scale=0)
         load_text = gr.Text(label="Load status")

         torch_device = chatf.torch_device
     if model_type == "Mistral Open Orca (larger, slow)":
+        if torch_device == "cuda":
+            gpu_config.update_gpu(12)
+        else:
+            gpu_config.update_gpu(gpu_layers)
+            cpu_config.update_gpu(gpu_layers)
         print("Loading with", cpu_config.gpu_layers, "model layers sent to GPU.")
     with gr.Tab("Advanced features"):
         model_choice = gr.Radio(label="Choose a chat model", value="Flan Alpaca (small, fast)", choices = ["Flan Alpaca (small, fast)", "Mistral Open Orca (larger, slow)"])
         with gr.Row():
+            gpu_layer_choice = gr.Slider(label="Choose number of model layers to send to GPU (WARNING: please don't modify unless you have a GPU).", value=0, minimum=0, maximum=5, step = 1, visible=False)
             change_model_button = gr.Button(value="Load model", scale=0)
         load_text = gr.Text(label="Load status")

chatfuncs/chatfuncs.py CHANGED Viewed

@@ -69,7 +69,7 @@ kw_model = pipeline("feature-extraction", model="sentence-transformers/all-MiniL
 if torch.cuda.is_available():
     torch_device = "cuda"
-    gpu_layers = 0
 else:
     torch_device =  "cpu"
     gpu_layers = 0

 if torch.cuda.is_available():
     torch_device = "cuda"
+    gpu_layers = 12
 else:
     torch_device =  "cpu"
     gpu_layers = 0