# Sampling keyword arguments; the call they belong to opens and closes outside
# this excerpt. NOTE(review): the names match Hugging Face `generate()`
# options -- confirm against the actual callee.
# - max_new_tokens is taken from `tokens`, which is defined outside this excerpt.
# - temperature=1.39 is above 1.0; presumably chosen on purpose for more varied
#   output -- TODO confirm the value is intended.
# - top_k=50, top_p=0.9 and typical_p=0.2 are all set at once; NOTE(review):
#   verify the combined truncation is wanted and not a leftover from tuning.
do_sample=True, max_new_tokens=tokens, top_p=0.9, top_k=50, temperature=1.39, repetition_penalty=1.08, typical_p=0.2,