{
  "temperature": 0.7,
  "top_p": 0.9,
  "max_new_tokens": 4096,
  "stop": [
    "<|im_start|>",
    "<|im_end|>",
    "user",
    "assistant"
  ]
}