temperature
top_k
top_p
frequency_penalty
# Example payload dict. Only "model" and "messages" are unannotated in the
# original snippet; every key marked "optional" below may be added as needed.
payload = {
    "model": "Qwen/Qwen2.5-Math-72B-Instruct",
    "messages": [
        {
            "role": "user",
            "content": "1+1=?",
        }
    ],
    "max_tokens": 200,       # optional: add as needed
    "temperature": 0.7,      # optional: add as needed
    "top_k": 50,             # optional: add as needed
    "top_p": 0.7,            # optional: add as needed
    "frequency_penalty": 0,  # optional: add as needed
}
max_tokens
上下文长度
context_length