RinInori committed on
Commit
c31cb2d
1 Parent(s): 04ec6d0

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -6
app.py CHANGED
@@ -12,12 +12,11 @@ BASE_MODEL = "TheBloke/stable-vicuna-13B-HF"
12
  device_map = {0: [0, 1, 2], 1: [3, 4, 5]}
13
 
14
  model = LlamaForCausalLM.from_pretrained(
15
- BASE_MODEL,
16
- load_in_8bit=True,
17
- load_in_8bit_fp32_cpu_offload=True,
18
- torch_dtype=torch.float16,
19
- device_map=device_map,
20
- offload_folder="./cache"
21
  )
22
 
23
  tokenizer = LlamaTokenizer.from_pretrained(BASE_MODEL)
 
12
  device_map = {0: [0, 1, 2], 1: [3, 4, 5]}
13
 
14
  model = LlamaForCausalLM.from_pretrained(
15
+ MODEL_NAME,
16
+ torch_dtype=torch.float16,
17
+ load_in_8bit=True,
18
+ device_map="auto",
19
+ offload_folder="./cache",
 
20
  )
21
 
22
  tokenizer = LlamaTokenizer.from_pretrained(BASE_MODEL)