Update handler.py
Browse files - handler.py +3 -2
handler.py
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
|
2 |
-
import torch
|
3 |
import os
|
4 |
|
5 |
class EndpointHandler:
|
@@ -16,7 +16,8 @@ class EndpointHandler:
|
|
16 |
model_name,
|
17 |
device_map="auto",
|
18 |
torch_dtype=torch.float16,
|
19 |
-
offload_folder=offload_dir
|
|
|
20 |
)
|
21 |
self.tokenizer = AutoTokenizer.from_pretrained(model_name)
|
22 |
|
|
|
1 |
from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
|
2 |
+
import torch
|
3 |
import os
|
4 |
|
5 |
class EndpointHandler:
|
|
|
16 |
model_name,
|
17 |
device_map="auto",
|
18 |
torch_dtype=torch.float16,
|
19 |
+
offload_folder=offload_dir,
|
20 |
+
offload_state_dict=True # Add this parameter to handle offloading better
|
21 |
)
|
22 |
self.tokenizer = AutoTokenizer.from_pretrained(model_name)
|
23 |
|