Pārlūkot izejas kodu

Fix: local variable issue. (#9255)

### What problem does this PR solve?

#9227

### Type of change

- [x] Bug Fix (non-breaking change which fixes an issue)
tags/v0.20.1
Kevin Hu pirms 2 mēnešiem
vecāks
revīzija
2124329e95
Revīzijas autora e-pasta adrese nav piesaistīta nevienam kontam
2 mainīti faili ar 7 papildinājumiem un 2 dzēšanām
  1. 1
    0
      rag/llm/cv_model.py
  2. 6
    2
      rag/svr/task_executor.py

+ 1
- 0
rag/llm/cv_model.py Parādīt failu

yield response.usage_metadata.total_token_count
else:
yield 0


class NvidiaCV(Base):
_FACTORY_NAME = "NVIDIA"

+ 6
- 2
rag/svr/task_executor.py Parādīt failu

return settings.docStoreConn.createIdx(idxnm, row.get("kb_id", ""), vector_size)




@timeout(60*20)
async def embedding(docs, mdl, parser_config=None, callback=None):
if parser_config is None:
parser_config = {}
tts = np.concatenate([vts for _ in range(len(tts))], axis=0)
tk_count += c


@timeout(5)
def batch_encode(txts):
nonlocal mdl
return mdl.encode([truncate(c, mdl.max_length-10) for c in txts])

cnts_ = np.array([])
for i in range(0, len(cnts), EMBEDDING_BATCH_SIZE):
async with embed_limiter:
vts, c = await trio.to_thread.run_sync(lambda: mdl.encode([truncate(c, mdl.max_length-10) for c in cnts[i: i + EMBEDDING_BATCH_SIZE]]))
vts, c = await trio.to_thread.run_sync(lambda: batch_encode(cnts[i: i + EMBEDDING_BATCH_SIZE]))
if len(cnts_) == 0:
cnts_ = vts
else:

Notiek ielāde…
Atcelt
Saglabāt