{
  "_from_model_config": true,
  "bos_token_id": 1,
  "eos_token_id": 2,
  "pad_token_id": 0,
  "transformers_version": "4.35.2",
  
  "max_length": 512,            // Limits the length of the output text
  "temperature": 0.7,           // Controls randomness, higher means more random
  "top_p": 0.9,                 // Nucleus sampling, considers only top_p highest probability tokens
  "top_k": 50,                  // Limits the sample space to top_k tokens with highest probabilities
  "do_sample": true,            // Enables sampling instead of greedy decoding
  "repetition_penalty": 1.2,    // Penalizes repetition
  "num_return_sequences": 1     // Number of output sequences to generate
}