BlinkDL committed on
Commit
0fe023b
1 Parent(s): 73d375b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -6,7 +6,7 @@ from pynvml import *
6
  nvmlInit()
7
  gpu_h = nvmlDeviceGetHandleByIndex(0)
8
  ctx_limit = 2048
9
- title = "RWKV-4-Pile-14B-20230228-ctx4096-test663"
10
  desc = f'''Links:
11
  <a href='https://github.com/BlinkDL/ChatRWKV' target="_blank" style="margin:0 0.5em">ChatRWKV</a>
12
  <a href='https://github.com/BlinkDL/RWKV-LM' target="_blank" style="margin:0 0.5em">RWKV-LM</a>
@@ -17,7 +17,7 @@ os.environ["RWKV_JIT_ON"] = '1'
17
  os.environ["RWKV_CUDA_ON"] = '1' # if '1' then use CUDA kernel for seq mode (much faster)
18
 
19
  from rwkv.model import RWKV
20
- model_path = hf_hub_download(repo_id="BlinkDL/rwkv-4-pile-14b", filename="RWKV-4-Pile-14B-20230228-ctx4096-test663.pth")
21
  model = RWKV(model=model_path, strategy='cuda fp16i8 *20 -> cuda fp16')
22
  from rwkv.utils import PIPELINE, PIPELINE_ARGS
23
  pipeline = PIPELINE(model, "20B_tokenizer.json")
 
6
  nvmlInit()
7
  gpu_h = nvmlDeviceGetHandleByIndex(0)
8
  ctx_limit = 2048
9
+ title = "RWKV-4-Pile-14B-20230313-ctx8192-test1050"
10
  desc = f'''Links:
11
  <a href='https://github.com/BlinkDL/ChatRWKV' target="_blank" style="margin:0 0.5em">ChatRWKV</a>
12
  <a href='https://github.com/BlinkDL/RWKV-LM' target="_blank" style="margin:0 0.5em">RWKV-LM</a>
 
17
  os.environ["RWKV_CUDA_ON"] = '1' # if '1' then use CUDA kernel for seq mode (much faster)
18
 
19
  from rwkv.model import RWKV
20
+ model_path = hf_hub_download(repo_id="BlinkDL/rwkv-4-pile-14b", filename=f"{title}.pth")
21
  model = RWKV(model=model_path, strategy='cuda fp16i8 *20 -> cuda fp16')
22
  from rwkv.utils import PIPELINE, PIPELINE_ARGS
23
  pipeline = PIPELINE(model, "20B_tokenizer.json")