dingckc committed on
Commit
a4ad8e2
·
verified ·
1 Parent(s): 5b8d2f7

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -1
app.py CHANGED
@@ -3,10 +3,12 @@ import gradio as gr
3
  from transformers import AutoTokenizer, AutoModelForCausalLM
4
  import torch
5
 
 
 
6
  # 設置模型 ID 和加載 Hugging Face API token
7
  model_id = "dingckc/FineLlama-3.1-8B"
8
  tokenizer = AutoTokenizer.from_pretrained(model_id, token=os.getenv('ACCESS_KEY'))
9
- model = AutoModelForCausalLM.from_pretrained(model_id, token=os.getenv('ACCESS_KEY'))
10
  model = model.to("cuda" if torch.cuda.is_available() else "cpu")
11
 
12
  # 定義推理函數
 
3
  from transformers import AutoTokenizer, AutoModelForCausalLM
4
  import torch
5
 
6
+ import bitsandbytes as bnb
7
+
8
  # 設置模型 ID 和加載 Hugging Face API token
9
  model_id = "dingckc/FineLlama-3.1-8B"
10
  tokenizer = AutoTokenizer.from_pretrained(model_id, token=os.getenv('ACCESS_KEY'))
11
+ model = AutoModelForCausalLM.from_pretrained(model_id, load_in_8bit=True, token=os.getenv('ACCESS_KEY'))
12
  model = model.to("cuda" if torch.cuda.is_available() else "cpu")
13
 
14
  # 定義推理函數