Skip to content

Commit 561fcf7

Browse files
author
Roberto Alsina
committed May 23, 2017
lint
1 parent fdc0f59 commit 561fcf7

File tree

1 file changed

+3
-4
lines changed

1 file changed

+3
-4
lines changed
 

‎v7/similarity/similarity.py

+3 -4
Original file line number | Diff line number | Diff line change
@@ -71,7 +71,6 @@ def write_similar(path, related):
7171
with open(path, 'w+') as outf:
7272
json.dump(data, outf)
7373

74-
7574
def tags_similarity(p1, p2):
7675
t1 = set(p1.tags)
7776
t2 = set(p2.tags)
@@ -98,16 +97,16 @@ def title_similarity(p1, p2):
9897
index = gensim.similarities.MatrixSimilarity(lsi[corpus])
9998
for i, post in enumerate(self.site.timeline):
10099
# FIXME config output
101-
out_name = os.path.join('output', post.destination_path(lang=lang))+'.related.json'
100+
out_name = os.path.join('output', post.destination_path(lang=lang)) + '.related.json'
102101
doc = texts[i]
103102
vec_bow = dictionary.doc2bow(doc)
104103
vec_lsi = lsi[vec_bow]
105104
body_sims = index[vec_lsi]
106105
tag_sims = [tags_similarity(post, p) for p in self.site.timeline]
107106
title_sims = [title_similarity(post, p) for p in self.site.timeline]
108-
full_sims = [tag_sims[i] + title_sims[i] + body_sims[i] *2 for i in range(len(self.site.timeline))]
107+
full_sims = [tag_sims[i] + title_sims[i] + body_sims[i] * 1.5 for i in range(len(self.site.timeline))]
109108
full_sims = sorted(enumerate(full_sims), key=lambda item: -item[1])
110-
related = [(self.site.timeline[s[0]], s[1], tag_sims[s[0]], title_sims[s[0]], body_sims[s[0]]) for s in full_sims[:11] if s[0] != i ]
109+
related = [(self.site.timeline[s[0]], s[1], tag_sims[s[0]], title_sims[s[0]], body_sims[s[0]]) for s in full_sims[:11] if s[0] != i]
111110
task = {
112111
'basename': self.name,
113112
'name': out_name,

0 commit comments

Comments
 (0)
Please sign in to comment.