|
|
|
@@ -16,7 +16,6 @@ |
|
|
|
|
|
|
|
import logging |
|
|
|
import json |
|
|
|
import math |
|
|
|
import re |
|
|
|
from collections import defaultdict |
|
|
|
|
|
|
|
@@ -234,11 +233,11 @@ class FulltextQueryer: |
|
|
|
s = 1e-9 |
|
|
|
for k, v in qtwt.items(): |
|
|
|
if k in dtwt: |
|
|
|
s += v * dtwt[k] |
|
|
|
s += v #* dtwt[k] |
|
|
|
q = 1e-9 |
|
|
|
for k, v in qtwt.items(): |
|
|
|
q += v * v |
|
|
|
return math.sqrt(3. * (s / q / math.log10( len(dtwt.keys()) + 512 ))) |
|
|
|
q += v #* v |
|
|
|
return s/q #math.sqrt(3. * (s / q / math.log10( len(dtwt.keys()) + 512 ))) |
|
|
|
|
|
|
|
def paragraph(self, content_tks: str, keywords: list = [], keywords_topn=30): |
|
|
|
if isinstance(content_tks, str): |