forcemultiplier
/

gpqa-syngen-gemma2-2b

fullstack committed on Oct 4, 2024

Commit

63c0baf

verified ·

1 Parent(s): 1a821d0

Upload folder using huggingface_hub

Files changed (1) hide show

run_vllm_2b.sh CHANGED Viewed

@@ -6,6 +6,6 @@ VLLM_ALLOW_RUNTIME_LORA_UPDATING=1 VLLM_ALLOW_LONG_MAX_MODEL_LEN=1 vllm serve ~/
   --max-model-len 8192 \
   --disable-log-requests \
   --enable-lora \
-  --lora-modules gpqa=./gpqa \
-  # --guided-decoding-backend lm-format-enforcer \

   --max-model-len 8192 \
   --disable-log-requests \
   --enable-lora \
+  --lora-modules gpqa=./ \
+  # --guided-decoding-backend lm-format-enforcer \