oleksandrfluxon
committed on
Commit
•
641be9d
1
Parent(s):
594d449
Update pipeline.py
Browse files
- pipeline.py +2 -2
pipeline.py
CHANGED
@@ -14,8 +14,8 @@ class PreTrainedPipeline():
|
|
14 |
path,
|
15 |
trust_remote_code=True
|
16 |
)
|
17 |
-
config.attn_config['attn_impl'] = 'triton'
|
18 |
-
config.init_device = 'cuda:0' # For fast initialization directly on GPU!
|
19 |
config.max_seq_len = 4096 # (input + output) tokens can now be up to 4096
|
20 |
|
21 |
print("===> loading model")
|
|
|
14 |
path,
|
15 |
trust_remote_code=True
|
16 |
)
|
17 |
+
# config.attn_config['attn_impl'] = 'triton'
|
18 |
+
# config.init_device = 'cuda:0' # For fast initialization directly on GPU!
|
19 |
config.max_seq_len = 4096 # (input + output) tokens can now be up to 4096
|
20 |
|
21 |
print("===> loading model")
|