瀏覽代碼

refine xinference (#2521)

### What problem does this PR solve?

#1588

### Type of change

- [x] Refactoring
tags/v0.12.0
Kevin Hu 1 年之前
父節點
當前提交
4a6a2a0f1b
沒有連結到貢獻者的電子郵件帳戶。
共有 4 個檔案被更改,包括 8 行新增和 0 行刪除
  1. 2
    0
      rag/llm/cv_model.py
  2. 2
    0
      rag/llm/embedding_model.py
  3. 2
    0
      rag/llm/rerank_model.py
  4. 2
    0
      rag/llm/sequence2txt_model.py

+ 2
- 0
rag/llm/cv_model.py 查看文件

@@ -449,6 +449,8 @@ class LocalAICV(GptV4):

class XinferenceCV(Base):
def __init__(self, key, model_name="", lang="Chinese", base_url=""):
if base_url.split("/")[-1] != "v1":
base_url = os.path.join(base_url, "v1")
self.client = OpenAI(api_key="xxx", base_url=base_url)
self.model_name = model_name
self.lang = lang

+ 2
- 0
rag/llm/embedding_model.py 查看文件

@@ -268,6 +268,8 @@ class FastEmbed(Base):

class XinferenceEmbed(Base):
def __init__(self, key, model_name="", base_url=""):
if base_url.split("/")[-1] != "v1":
base_url = os.path.join(base_url, "v1")
self.client = OpenAI(api_key="xxx", base_url=base_url)
self.model_name = model_name


+ 2
- 0
rag/llm/rerank_model.py 查看文件

@@ -140,6 +140,8 @@ class YoudaoRerank(DefaultRerank):

class XInferenceRerank(Base):
def __init__(self, key="xxxxxxx", model_name="", base_url=""):
if base_url.split("/")[-1] != "v1":
base_url = os.path.join(base_url, "v1")
self.model_name = model_name
self.base_url = base_url
self.headers = {

+ 2
- 0
rag/llm/sequence2txt_model.py 查看文件

@@ -93,6 +93,8 @@ class AzureSeq2txt(Base):

class XinferenceSeq2txt(Base):
def __init__(self, key, model_name="", base_url=""):
if base_url.split("/")[-1] != "v1":
base_url = os.path.join(base_url, "v1")
self.client = OpenAI(api_key="xxx", base_url=base_url)
self.model_name = model_name


Loading…
取消
儲存