yuhaofeng-shiba committed on
Commit
9f88a9b
·
1 Parent(s): b28b3e5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -22,7 +22,7 @@ def init_args():
22
  args.batch_size = 1
23
  args.seq_length = 512
24
  args.world_size = 1
25
- args.use_int8 = False
26
  args.top_p = 0
27
  args.repetition_penalty_range = 1024
28
  args.repetition_penalty_slope = 0
@@ -40,11 +40,12 @@ def init_model():
40
  model = LLaMa(args)
41
  torch.set_default_tensor_type(torch.FloatTensor)
42
  model = load_model(model, args.load_model_path)
43
- print('done load model.')
44
  model.eval()
45
 
46
  device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
47
  model.to(device)
 
48
  lm_generation = LmGeneration(model, args.tokenizer)
49
 
50
 
 
22
  args.batch_size = 1
23
  args.seq_length = 512
24
  args.world_size = 1
25
+ args.use_int8 = True
26
  args.top_p = 0
27
  args.repetition_penalty_range = 1024
28
  args.repetition_penalty_slope = 0
 
40
  model = LLaMa(args)
41
  torch.set_default_tensor_type(torch.FloatTensor)
42
  model = load_model(model, args.load_model_path)
43
+ print('load model done.')
44
  model.eval()
45
 
46
  device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
47
  model.to(device)
48
+ print('to cuda.')
49
  lm_generation = LmGeneration(model, args.tokenizer)
50
 
51