Spaces:
Paused
Paused
Update constants.py
Browse files — constants.py (+4 −4)
constants.py
CHANGED
@@ -33,8 +33,8 @@ MAX_NEW_TOKENS = CONTEXT_WINDOW_SIZE # int(CONTEXT_WINDOW_SIZE/4)
|
|
33 |
|
34 |
#### If you get a "not enough space in the buffer" error, reduce the values below: start with half of the original values and keep halving them until the error stops appearing
|
35 |
|
36 |
-
N_GPU_LAYERS =
|
37 |
-
N_BATCH =
|
38 |
|
39 |
### From experimenting with the Llama-2-7B-Chat-GGML model on 8GB VRAM, these values work:
|
40 |
# N_GPU_LAYERS = 20
|
@@ -56,7 +56,7 @@ DOCUMENT_MAP = {
|
|
56 |
}
|
57 |
|
58 |
# Default Instructor Model
|
59 |
-
|
60 |
|
61 |
####
|
62 |
#### OTHER EMBEDDING MODEL OPTIONS
|
@@ -71,7 +71,7 @@ DOCUMENT_MAP = {
|
|
71 |
#### MULTILINGUAL EMBEDDING MODELS
|
72 |
####
|
73 |
|
74 |
-
EMBEDDING_MODEL_NAME = "intfloat/multilingual-e5-large" # Uses 2.5 GB of VRAM
|
75 |
# EMBEDDING_MODEL_NAME = "intfloat/multilingual-e5-base" # Uses 1.2 GB of VRAM
|
76 |
|
77 |
|
|
|
33 |
|
34 |
#### If you get a "not enough space in the buffer" error, reduce the values below: start with half of the original values and keep halving them until the error stops appearing
|
35 |
|
36 |
+
N_GPU_LAYERS = 20 # Llama-2-70B has 83 layers
|
37 |
+
N_BATCH = 512
|
38 |
|
39 |
### From experimenting with the Llama-2-7B-Chat-GGML model on 8GB VRAM, these values work:
|
40 |
# N_GPU_LAYERS = 20
|
|
|
56 |
}
|
57 |
|
58 |
# Default Instructor Model
|
59 |
+
EMBEDDING_MODEL_NAME = "hkunlp/instructor-large" # Uses 1.5 GB of VRAM (High Accuracy with lower VRAM usage)
|
60 |
|
61 |
####
|
62 |
#### OTHER EMBEDDING MODEL OPTIONS
|
|
|
71 |
#### MULTILINGUAL EMBEDDING MODELS
|
72 |
####
|
73 |
|
74 |
+
# EMBEDDING_MODEL_NAME = "intfloat/multilingual-e5-large" # Uses 2.5 GB of VRAM
|
75 |
# EMBEDDING_MODEL_NAME = "intfloat/multilingual-e5-base" # Uses 1.2 GB of VRAM
|
76 |
|
77 |
|