do_sample=True,
max_new_tokens=max_length,
top_p=1,
typical_p=0.3,
temperature=0.7,
