Procházet zdrojové kódy

Fix: Qwen-vl-plus url error (#7281)

### What problem does this PR solve?

Fix Qwen-vl-* url error. #7277

### Type of change

- [x] Bug Fix (non-breaking change which fixes an issue)
tags/v0.19.0
Yongteng Lei před 6 měsíci
rodič
revize
97a13ef1ab
Žádný účet není propojen s e-mailovou adresou tvůrce revize
1 změnil soubory, kde provedl 3 přidání a 3 odebrání
  1. 3
    3
      rag/llm/chat_model.py

+ 3
- 3
rag/llm/chat_model.py Zobrazit soubor

@@ -565,7 +565,7 @@ class QWenChat(Base):

dashscope.api_key = key
self.model_name = model_name
- if self.is_reasoning_model(self.model_name):
+ if self.is_reasoning_model(self.model_name) or self.model_name in ["qwen-vl-plus", "qwen-vl-plus-latest", "qwen-vl-max", "qwen-vl-max-latest"]:
super().__init__(key, model_name, "https://dashscope.aliyuncs.com/compatible-mode/v1")

def chat_with_tools(self, system: str, history: list, gen_conf: dict) -> tuple[str, int]:
@@ -643,7 +643,7 @@ class QWenChat(Base):
def chat(self, system, history, gen_conf):
if "max_tokens" in gen_conf:
del gen_conf["max_tokens"]
- if self.is_reasoning_model(self.model_name):
+ if self.is_reasoning_model(self.model_name) or self.model_name in ["qwen-vl-plus", "qwen-vl-plus-latest", "qwen-vl-max", "qwen-vl-max-latest"]:
return super().chat(system, history, gen_conf)

stream_flag = str(os.environ.get("QWEN_CHAT_BY_STREAM", "true")).lower() == "true"
@@ -811,7 +811,7 @@ class QWenChat(Base):
def chat_streamly(self, system, history, gen_conf):
if "max_tokens" in gen_conf:
del gen_conf["max_tokens"]
- if self.is_reasoning_model(self.model_name):
+ if self.is_reasoning_model(self.model_name) or self.model_name in ["qwen-vl-plus", "qwen-vl-plus-latest", "qwen-vl-max", "qwen-vl-max-latest"]:
return super().chat_streamly(system, history, gen_conf)

return self._chat_streamly(system, history, gen_conf)

Načítá se…
Zrušit
Uložit