Update app.py
Browse files
app.py
CHANGED
@@ -25,7 +25,7 @@ model = AutoModelForCausalLM.from_pretrained(
|
|
25 |
model_name,
|
26 |
quantization_config=quantization_config,
|
27 |
device_map="auto",
|
28 |
-
max_memory={0: "22GiB", "cpu": "6GiB"} # Prevent VRAM overflow
|
29 |
)
|
30 |
text_generator = pipeline("text-generation", model=model, tokenizer=tokenizer)
|
31 |
|
|
|
25 |
model_name,
|
26 |
quantization_config=quantization_config,
|
27 |
device_map="auto",
|
28 |
+
max_memory={0: "22GiB", "cpu": "6GiB"} # Prevent VRAM overflow
|
29 |
)
|
30 |
text_generator = pipeline("text-generation", model=model, tokenizer=tokenizer)
|
31 |
|