Update main.py
Browse files
main.py
CHANGED
@@ -21,9 +21,9 @@ embeddingModel = AutoModel.from_pretrained('./multilingual-e5-base')
|
|
21 |
|
22 |
# chatGpt replacement
|
23 |
inferenceTokenizer = AutoTokenizer.from_pretrained(
|
24 |
-
"./ct2fast-flan-alpaca-
|
25 |
inferenceTranslator = Translator(
|
26 |
-
"./ct2fast-flan-alpaca-
|
27 |
|
28 |
|
29 |
class EmbeddingRequest(BaseModel):
|
|
|
21 |
|
22 |
# chatGpt replacement
|
23 |
inferenceTokenizer = AutoTokenizer.from_pretrained(
|
24 |
+
"./ct2fast-flan-alpaca-xl")
|
25 |
inferenceTranslator = Translator(
|
26 |
+
"./ct2fast-flan-alpaca-xl", compute_type="int8", device="cpu", inter_threads=1, intra_threads=2)
|
27 |
|
28 |
|
29 |
class EmbeddingRequest(BaseModel):
|