# Sampling-related keyword arguments. The call these belong to opens and
# closes outside this excerpt.
# NOTE(review): the names match Hugging Face `generate()` /
# `GenerationConfig` options -- confirm the callee before relying on the
# notes below.
do_sample=True,
# `tokens` is defined outside this excerpt; presumably the cap on newly
# generated tokens (excluding the prompt) -- TODO confirm.
max_new_tokens=tokens,
# NOTE(review): 1.0 is presumably the neutral value (no nucleus filtering),
# leaving top_k as the only active truncation -- confirm.
top_p=1.0,
top_k=100,
# NOTE(review): slightly above 1.0; presumably a deliberate, hand-tuned
# nudge towards more varied output -- confirm with the author.
temperature=1.07,
# NOTE(review): slightly above 1.0; presumably a mild penalty on repeated
# tokens -- confirm.
repetition_penalty=1.05,
# NOTE(review): 1.0 is presumably the neutral value (typical sampling
# disabled) -- confirm.
typical_p=1.0,