SparseLlama-3.1-8B-gsm8k-pruned.2of4-tensor_weights_per_token_dynamic_act_fp8-BitMaskCompressed
/
generation_config.json
{
  "_from_model_config": true,
  "bos_token_id": 128000,
  "do_sample": true,
  "eos_token_id": 128001,
  "temperature": 0.6,
  "top_p": 0.9,
  "transformers_version": "4.46.3"
}