do_sample=True, max_new_tokens=tokens, top_p=0.98, top_k=0, temperature=0.63, repetition_penalty=1.05, typical_p=1.0,