amir22010 committed on
Commit
016850e
1 Parent(s): 7ea5fab

added cache

Browse files
Files changed (1) hide show
  1. app.py +3 -1
app.py CHANGED
@@ -6,6 +6,8 @@ llm = Llama.from_pretrained(
6
  repo_id="amir22010/fine_tuned_product_marketing_email_gemma_2_9b_q4_k_m",
7
  filename="unsloth.Q4_K_M.gguf",
8
  cache_dir=os.path.abspath(os.getcwd()),
 
 
9
  verbose=False
10
  )
11
 
@@ -37,7 +39,7 @@ def greet(product,description):
37
  # response_format={
38
  # "type": "json_object",
39
  # },
40
- max_tokens=8192,
41
  temperature=0.7,
42
  stream=True
43
  )
 
6
  repo_id="amir22010/fine_tuned_product_marketing_email_gemma_2_9b_q4_k_m",
7
  filename="unsloth.Q4_K_M.gguf",
8
  cache_dir=os.path.abspath(os.getcwd()),
9
+ n_ctx=2048,
10
+ n_batch=126,
11
  verbose=False
12
  )
13
 
 
39
  # response_format={
40
  # "type": "json_object",
41
  # },
42
+ max_tokens=4096,
43
  temperature=0.7,
44
  stream=True
45
  )