chat_format="llama-2" ) res = llm.create_chat_completion( messages = [ {"role": "system", "content": "You are a helpful assistant."}, { "role": "user", "content": "来一段金瓶梅风格的情感小说,100字,别太露骨了" } ],stream=True ) for chunk in res:...