yuhaofeng-shiba committed on
Commit
492f975
1 Parent(s): aed5af0

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -1
app.py CHANGED
@@ -7,6 +7,8 @@ from models.tokenize import Tokenizer
7
  from models.llama import *
8
  from generate import LmGeneration
9
 
 
 
10
 
11
  args = None
12
  lm_generation = None
@@ -22,7 +24,7 @@ def init_args():
22
  args.batch_size = 1
23
  args.seq_length = 512
24
  args.world_size = 1
25
- args.use_int8 = True
26
  args.top_p = 0
27
  args.repetition_penalty_range = 1024
28
  args.repetition_penalty_slope = 0
 
7
  from models.llama import *
8
  from generate import LmGeneration
9
 
10
+ import os
11
+ os.environ['CUDA_LAUNCH_BLOCKING'] = '1'
12
 
13
  args = None
14
  lm_generation = None
 
24
  args.batch_size = 1
25
  args.seq_length = 512
26
  args.world_size = 1
27
+ args.use_int8 = False
28
  args.top_p = 0
29
  args.repetition_penalty_range = 1024
30
  args.repetition_penalty_slope = 0