Преглед на файлове

refine token similarity (#2824)

### What problem does this PR solve?


### Type of change

- [x] Performance Improvement
tags/v0.13.0
Kevin Hu преди 1 година
родител
ревизия
b164116277
No account linked to committer's email address
променени са 2 файла, в които са добавени 3 реда и са изтрити 6 реда
  1. 1
    1
      agent/canvas.py
  2. 2
    5
      rag/nlp/query.py

+ 1
- 1
agent/canvas.py Целия файл

  convs = []
  for role, obj in self.history[(window_size + 1) * -1:]:
      convs.append({"role": role, "content": (obj if role == "user" else
-         '\n'.join(pd.DataFrame(obj)['content']))})
+         '\n'.join([str(s) for s in pd.DataFrame(obj)['content']]))})
  return convs


  def add_user_input(self, question):

+ 2
- 5
rag/nlp/query.py Целия файл

  s += v # * dtwt[k]
  q = 1e-9
  for k, v in qtwt.items():
-     q += v # * v
- #d = 1e-9
- # for k, v in dtwt.items():
- # d += v * v
- return s / q / max(1, math.sqrt(math.log10(max(len(qtwt.keys()), len(dtwt.keys())))))# math.sqrt(q) / math.sqrt(d)
+     q += v
+ return s / q

Loading…
Отказ
Запис