herMaster committed on
Commit
832c3db
1 Parent(s): 763ab45

max_new_tokens update

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -38,7 +38,8 @@ llm = AutoModelForCausalLM.from_pretrained("TheBloke/Llama-2-7B-Chat-GGUF",
38
  model_file="llama-2-7b-chat.Q3_K_S.gguf",
39
  model_type="llama",
40
  temperature = 0.2,
41
- repetition_penalty = 1.5
 
42
  )
43
 
44
 
 
38
  model_file="llama-2-7b-chat.Q3_K_S.gguf",
39
  model_type="llama",
40
  temperature = 0.2,
41
+ repetition_penalty = 1.5,
42
+ max_new_tokens = 300,
43
  )
44
 
45