Docfile committed on
Commit
45eedc1
·
1 Parent(s): a0a57e5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -4
app.py CHANGED
@@ -21,14 +21,15 @@ from langchain import PromptTemplate, LLMChain
21
  model_name_or_path = "hlhr202/llama-7B-ggml-int4"
22
  model_basename = "ggml-model-q4_0.bin" # the model is in bin format
23
 
24
- model_path = hf_hub_download(repo_id=model_name_or_path, filename=model_basename)
25
 
26
  n_gpu_layers = 40 # Change this value based on your model and your GPU VRAM pool.
27
  n_batch = 256
28
 
29
- llm = LlamaCpp(
30
- model_path=model_path, callbacks=[StreamingStdOutCallbackHandler()]
31
- )
 
32
 
33
  #llm = LLM = G4FLLM(model=models.gpt_35_turbo,provider=Provider.DeepAi,)
34
 
 
21
  model_name_or_path = "hlhr202/llama-7B-ggml-int4"
22
  model_basename = "ggml-model-q4_0.bin" # the model is in bin format
23
 
24
+ #model_path = hf_hub_download(repo_id=model_name_or_path, filename=model_basename)
25
 
26
  n_gpu_layers = 40 # Change this value based on your model and your GPU VRAM pool.
27
  n_batch = 256
28
 
29
+ llm = LLM = G4FLLM(
30
+ model=models.gpt_35_turbo,
31
+ provider=Provider.Acytoo,
32
+ )
33
 
34
  #llm = LLM = G4FLLM(model=models.gpt_35_turbo,provider=Provider.DeepAi,)
35