{
  "chat_format": "chatml",
  "do_sample": false,
  "eos_token_id": 151643,
  "max_new_tokens": 256,
  "max_window_size": 6144,
  "pad_token_id": 151643,
  "top_k": 50,
  "top_p": 0.9,
  "transformers_version": "4.31.0"
}