rphrp1985 committed on
Commit
16e49b4
1 Parent(s): 126e605

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -0
app.py CHANGED
@@ -7,6 +7,14 @@ import os
7
  """
8
  For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
9
  """
 
 
 
 
 
 
 
 
10
  client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
11
  # pip install 'git+https://github.com/huggingface/transformers.git'
12
 
 
7
  """
8
  For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
9
  """
10
+
11
+
12
+ subprocess.run(
13
+ "pip install flash-attn --no-build-isolation",
14
+ env={"FLASH_ATTENTION_SKIP_CUDA_BUILD": "TRUE"},
15
+ shell=True,
16
+ )
17
+
18
  client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
19
  # pip install 'git+https://github.com/huggingface/transformers.git'
20