Thanks for visiting codestin.com
Credit goes to github.com

Skip to content

Commit fe7450d

Browse files
author
Hai Liang Wang
committed
Closed chatopera#77 fix package version for better compatibility
1 parent b23e1c3 commit fe7450d

3 files changed

Lines changed: 17 additions & 8 deletions

File tree

demo.py

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -137,6 +137,13 @@ def test_nearby(self):
137137
def test_badcase_1(self):
138138
synonyms.display("人脸") # synonyms.display calls synonyms.nearby
139139

140+
141+
def test_basecase_2(self):
142+
print("test_basecase_2")
143+
sen1 = "今天天气"
144+
sen2 = "今天天气怎么样"
145+
r = synonyms.compare(sen1, sen2, seg=True)
146+
140147
def test():
141148
unittest.main()
142149

setup.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@
1313

1414
setup(
1515
name='synonyms',
16-
version='3.10.0',
16+
version='3.10.2',
1717
description='Chinese Synonyms for Natural Language Processing and Understanding',
1818
long_description=LONGDOC,
1919
author='Hai Liang Wang, Hu Ying Xi',
@@ -40,9 +40,9 @@
4040
install_requires=[
4141
'six>=1.11.0',
4242
'numpy>=1.13.1',
43-
'scipy==1.0.0',
44-
'scikit-learn==0.19.1',
45-
'absl-py==0.1.10'
43+
'scipy>=1.0.0',
44+
'scikit-learn>=0.19.1',
45+
'absl-py>=0.4'
4646
],
4747
package_data={
4848
'synonyms': [

synonyms/synonyms.py

Lines changed: 6 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -247,8 +247,10 @@ def _nearby_levenshtein_distance(s1, s2):
247247

248248
scores = []
249249
for x in second:
250-
scores.append(max([_levenshtein_distance(x, y) for y in ft]))
251-
s = np.sum(scores) / maxlen
250+
choices = [_levenshtein_distance(x, y) for y in ft]
251+
if len(choices) > 0: scores.append(max(choices))
252+
253+
s = np.sum(scores) / maxlen if len(scores) > 0 else 0
252254
return s
253255

254256
def _similarity_distance(s1, s2, ignore):
@@ -319,8 +321,8 @@ def compare(s1, s2, seg=True, ignore=False, stopwords=False):
319321
s2_words = []
320322

321323
if seg:
322-
s1 = [x for x in jieba.cut(s1)]
323-
s2 = [x for x in jieba.cut(s2)]
324+
s1 = [x for x in jieba.cut(s1, cut_all=False, HMM=False)]
325+
s2 = [x for x in jieba.cut(s2, cut_all=False, HMM=False)]
324326
else:
325327
s1 = s1.split()
326328
s2 = s2.split()

0 commit comments

Comments
 (0)