muryshev committed on
Commit
4b0ae5d
1 Parent(s): 47b6c1e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -16,7 +16,7 @@ ROLE_TOKENS = {
16
  "system": SYSTEM_TOKEN
17
  }
18
 
19
- CONTEXT_SIZE = 4096
20
 
21
  # Create a lock object
22
  lock = threading.Lock()
@@ -47,7 +47,7 @@ model = Llama(
47
  logits_all=True,
48
  #n_threads=12,
49
  verbose=True,
50
- n_gpu_layers=30,
51
  n_gqa=8 #must be set for 70b models
52
  )
53
 
 
16
  "system": SYSTEM_TOKEN
17
  }
18
 
19
+ CONTEXT_SIZE = 3000
20
 
21
  # Create a lock object
22
  lock = threading.Lock()
 
47
  logits_all=True,
48
  #n_threads=12,
49
  verbose=True,
50
+ n_gpu_layers=35,
51
  n_gqa=8 #must be set for 70b models
52
  )
53