This commit is contained in:
zcr
2026-06-17 11:58:06 +08:00
parent 44cd88e8af
commit 13d93088e7

View File

@@ -1,6 +1,7 @@
import os import os
from dotenv import load_dotenv from dotenv import load_dotenv
from langchain_ollama import ChatOllama
from langchain_qwq import ChatQwen from langchain_qwq import ChatQwen
load_dotenv() load_dotenv()
@@ -9,25 +10,40 @@ QWEN_API_KEY_INTL = os.environ.get("QWEN_API_KEY_INTL", "")
def build_llm(enable_thinking: bool = False): def build_llm(enable_thinking: bool = False):
llm = ChatQwen( # llm = ChatQwen(
model="qwen3.6-plus", # model="qwen3.6-plus",
timeout=None, # timeout=None,
max_retries=2, # max_retries=2,
enable_thinking=enable_thinking, # enable_thinking=enable_thinking,
streaming=True, # streaming=True,
api_key=QWEN_API_KEY_INTL, # api_key=QWEN_API_KEY_INTL,
# )
# return llm
llm = ChatOllama(
model="qwen3.6:27b",
base_url="http://127.0.0.1:11434",
reasoning=enable_thinking, # 核心开启思考自动拆分reasoning_content
temperature=0.7,
num_ctx=32768,
) )
return llm return llm
qwen_plus_llm = ChatQwen( # qwen_plus_llm = ChatQwen(
model="qwen-plus", # model="qwen-plus",
timeout=None, # timeout=None,
max_retries=2, # max_retries=2,
streaming=False, # streaming=False,
temperature=0.25, # temperature=0.25,
top_p=0.8, # top_p=0.8,
api_key=QWEN_API_KEY_INTL, # api_key=QWEN_API_KEY_INTL,
) # )
# response = qwen_plus_llm.invoke("你好") # response = qwen_plus_llm.invoke("你好")
# print(response) # print(response)
qwen_plus_llm = ChatOllama(
model="qwen3.6:27b", base_url="http://127.0.0.1:11434", reasoning=False, temperature=0.7, num_ctx=32768, extra_kwargs={"stream": False}
)
# for chunk in qwen_plus_llm.stream("你好"):
# print(chunk)