重构初始化逻辑以支持根据环境选择不同的LLM模型
This commit is contained in:
@@ -7,25 +7,27 @@ from langchain_qwq import ChatQwen
|
|||||||
load_dotenv()
|
load_dotenv()
|
||||||
|
|
||||||
QWEN_API_KEY_INTL = os.environ.get("QWEN_API_KEY_INTL", "")
|
QWEN_API_KEY_INTL = os.environ.get("QWEN_API_KEY_INTL", "")
|
||||||
|
SERVE_ENV = os.environ.get("SERVE_ENV", "dev") # prod 使用 Qwen API,dev 使用本地 Ollama
|
||||||
|
|
||||||
|
|
||||||
def build_llm(enable_thinking: bool = False):
|
def build_llm(enable_thinking: bool = False):
|
||||||
# llm = ChatQwen(
|
if SERVE_ENV == "prod":
|
||||||
# model="qwen3.6-plus",
|
llm = ChatQwen(
|
||||||
# timeout=None,
|
model="qwen3.6-plus",
|
||||||
# max_retries=2,
|
timeout=None,
|
||||||
# enable_thinking=enable_thinking,
|
max_retries=2,
|
||||||
# streaming=True,
|
enable_thinking=enable_thinking,
|
||||||
# api_key=QWEN_API_KEY_INTL,
|
streaming=True,
|
||||||
# )
|
api_key=QWEN_API_KEY_INTL,
|
||||||
# return llm
|
)
|
||||||
llm = ChatOllama(
|
else:
|
||||||
model="qwen3.6:27b",
|
llm = ChatOllama(
|
||||||
base_url="http://127.0.0.1:11434",
|
model="qwen3.6:27b",
|
||||||
reasoning=enable_thinking, # 核心:开启思考,自动拆分reasoning_content
|
base_url="http://127.0.0.1:11434",
|
||||||
temperature=0.7,
|
reasoning=enable_thinking,
|
||||||
num_ctx=32768,
|
temperature=0.7,
|
||||||
)
|
num_ctx=32768,
|
||||||
|
)
|
||||||
return llm
|
return llm
|
||||||
|
|
||||||
|
|
||||||
@@ -42,8 +44,19 @@ def build_llm(enable_thinking: bool = False):
|
|||||||
# print(response)
|
# print(response)
|
||||||
|
|
||||||
|
|
||||||
qwen_plus_llm = ChatOllama(
|
if SERVE_ENV == "prod":
|
||||||
model="qwen3.6:27b", base_url="http://127.0.0.1:11434", reasoning=False, temperature=0.7, num_ctx=32768, extra_kwargs={"stream": False}
|
qwen_plus_llm = ChatQwen(
|
||||||
)
|
model="qwen-plus",
|
||||||
|
timeout=None,
|
||||||
|
max_retries=2,
|
||||||
|
streaming=False,
|
||||||
|
temperature=0.25,
|
||||||
|
top_p=0.8,
|
||||||
|
api_key=QWEN_API_KEY_INTL,
|
||||||
|
)
|
||||||
|
else:
|
||||||
|
qwen_plus_llm = ChatOllama(
|
||||||
|
model="qwen3.6:27b", base_url="http://127.0.0.1:11434", reasoning=False, temperature=0.7, num_ctx=32768, extra_kwargs={"stream": False}
|
||||||
|
)
|
||||||
# for chunk in qwen_plus_llm.stream("你好"):
|
# for chunk in qwen_plus_llm.stream("你好"):
|
||||||
# print(chunk)
|
# print(chunk)
|
||||||
|
|||||||
Reference in New Issue
Block a user