route.py 1.3 KB

12345678910111213141516171819202122232425262728293031323334353637
  1. from fastapi import FastAPI
  2. from pydantic import BaseModel
  3. app = FastAPI()
  4. import json
  5. from openai import OpenAI
  6. qwclient = OpenAI(
  7. # 若没有配置环境变量,请用百炼API Key将下行替换为:api_key="sk-xxx",
  8. #api_key=os.getenv("DASHSCOPE_API_KEY"),
  9. api_key='ms-0edcfe5e-0d1f-4092-ac17-7c6f69127731',
  10. #base_url="https://dashscope.aliyuncs.com/compatible-mode/v1",
  11. base_url="https://api-inference.modelscope.cn/v1/",
  12. timeout=60
  13. )
  14. class Task(BaseModel):
  15. content: str
  16. @app.post("/ask/")
  17. async def submit(r: Task):
  18. content = json.loads(r.content)
  19. completion = qwclient.chat.completions.create(
  20. # 模型列表:https://help.aliyun.com/zh/model-studio/getting-started/models
  21. #model="glm-4.5-flash",
  22. model="Qwen/Qwen3-32B",
  23. messages=content,
  24. # Qwen3模型通过enable_thinking参数控制思考过程(开源版默认True,商业版默认False)
  25. # 使用Qwen3开源版模型时,若未启用流式输出,请将下行取消注释,否则会报错
  26. extra_body={"enable_thinking": False},
  27. #extra_body={"thinking": {"type": "disabled"}},
  28. )
  29. json_string = completion.choices[0].message.content
  30. print(json_string)
  31. return {"answer": json_string}