yuhaofeng-shiba committed on
Commit
784d667
1 Parent(s): 2598f17

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -4
app.py CHANGED
@@ -20,7 +20,7 @@ def init_args():
20
  args.config_path = './config/llama_7b.json'
21
  args.spm_model_path = './model_file/tokenizer.model'
22
  args.batch_size = 1
23
- args.seq_length = 512
24
  args.world_size = 1
25
  args.use_int8 = True
26
  args.top_p = 0
@@ -42,9 +42,6 @@ def init_model():
42
  model = load_model(model, args.load_model_path)
43
  model.eval()
44
 
45
- # for name, parameter in model.named_parameters():
46
- # print(name)
47
- # print(parameter)
48
  print(torch.cuda.max_memory_allocated() / 1024 ** 3)
49
  device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
50
  model.to(device)
 
20
  args.config_path = './config/llama_7b.json'
21
  args.spm_model_path = './model_file/tokenizer.model'
22
  args.batch_size = 1
23
+ args.seq_length = 256
24
  args.world_size = 1
25
  args.use_int8 = True
26
  args.top_p = 0
 
42
  model = load_model(model, args.load_model_path)
43
  model.eval()
44
 
 
 
 
45
  print(torch.cuda.max_memory_allocated() / 1024 ** 3)
46
  device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
47
  model.to(device)