oleksandrfluxon committed on
Commit
641be9d
1 Parent(s): 594d449

Update pipeline.py

Browse files
Files changed (1) hide show
  1. pipeline.py +2 -2
pipeline.py CHANGED
@@ -14,8 +14,8 @@ class PreTrainedPipeline():
14
  path,
15
  trust_remote_code=True
16
  )
17
- config.attn_config['attn_impl'] = 'triton'
18
- config.init_device = 'cuda:0' # For fast initialization directly on GPU!
19
  config.max_seq_len = 4096 # (input + output) tokens can now be up to 4096
20
 
21
  print("===> loading model")
 
14
  path,
15
  trust_remote_code=True
16
  )
17
+ # config.attn_config['attn_impl'] = 'triton'
18
+ # config.init_device = 'cuda:0' # For fast initialization directly on GPU!
19
  config.max_seq_len = 4096 # (input + output) tokens can now be up to 4096
20
 
21
  print("===> loading model")