mnauf
committed on
Commit
•
0a57ca5
1
Parent(s):
b98d5cd
first commit
Browse files
app.py
CHANGED
@@ -49,5 +49,5 @@ with gr.Blocks() as block:
|
|
49 |
outputs=outputs,
|
50 |
queue=True
|
51 |
)
|
52 |
-
block.queue(concurrency_count=5).launch(server_name="localhost", share=True)
|
53 |
-
|
|
|
49 |
outputs=outputs,
|
50 |
queue=True
|
51 |
)
|
52 |
+
# block.queue(concurrency_count=5).launch(server_name="localhost", share=True)
|
53 |
+
block.queue().launch()
|
sample.py
CHANGED
@@ -17,9 +17,9 @@ max_new_tokens = 500 # number of tokens generated in each sample
|
|
17 |
temperature = 0.8 # 1.0 = no change, < 1.0 = less random, > 1.0 = more random, in predictions
|
18 |
top_k = 200 # retain only the top_k most likely tokens, clamp others to have 0 probability
|
19 |
seed = 1337
|
20 |
-
device = 'cuda' # examples: 'cpu', 'cuda', 'cuda:0', 'cuda:1', etc.
|
21 |
dtype = 'bfloat16' # 'float32' or 'bfloat16' or 'float16'
|
22 |
-
compile = False # use PyTorch 2.0 to compile the model to be faster
|
23 |
exec(open('configurator.py').read()) # overrides from command line or config file
|
24 |
# -----------------------------------------------------------------------------
|
25 |
|
|
|
17 |
temperature = 0.8 # 1.0 = no change, < 1.0 = less random, > 1.0 = more random, in predictions
|
18 |
top_k = 200 # retain only the top_k most likely tokens, clamp others to have 0 probability
|
19 |
seed = 1337
|
20 |
+
device = 'cpu' # examples: 'cpu', 'cuda', 'cuda:0', 'cuda:1', etc.
|
21 |
dtype = 'bfloat16' # 'float32' or 'bfloat16' or 'float16'
|
22 |
+
compile = True # use PyTorch 2.0 to compile the model to be faster
|
23 |
exec(open('configurator.py').read()) # overrides from command line or config file
|
24 |
# -----------------------------------------------------------------------------
|
25 |
|