Skip to content

Commit 04ce18e

Browse files
committed
Fix source ordering issue in find_duplicate: look up each source by doc_id instead of by position in the query result
1 parent 94ec663 commit 04ce18e

File tree

1 file changed

+4
-5
lines changed

1 file changed

+4
-5
lines changed

application.py

Lines changed: 4 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -83,11 +83,10 @@ def find_duplicate():
8383
doc_ids, dists = imagesearch.search(vec, thresh)
8484
else:
8585
doc_ids, dists = imagesearch.search(vec)
86-
87-
sources = [d.get('source') for d in db.docs.find({"doc_id" : {"$in" : doc_ids}})]
86+
sources = {d.get('doc_id') : d.get('source') for d in db.docs.find({"doc_id" : {"$in" : doc_ids}})}
8887

8988
if doc_ids is not None:
90-
result = [{'doc_id' : doc_ids[i], 'dist' : dists[i], 'source' : sources[i]} for i in range(len(doc_ids))]
89+
result = [{'doc_id' : doc_ids[i], 'dist' : dists[i], 'source' : sources[doc_ids[i]]} for i in range(len(doc_ids))]
9190
ret = {'failed' : 0, 'result' : result}
9291
else:
9392
ret = {'failed' : 0, 'result' : []}
@@ -96,10 +95,10 @@ def find_duplicate():
9695
duplicate_doc = db.docs.find_one({"text" : text})
9796
vec = doc2vec(text)
9897
doc_ids, dists = textsearch.search(vec)
99-
sources = [d.get('source') for d in db.docs.find({"doc_id" : {"$in" : doc_ids}})]
98+
sources = {d.get('doc_id') : d.get('source') for d in db.docs.find({"doc_id" : {"$in" : doc_ids}})}
10099

101100
if doc_ids is not None:
102-
result = [{'doc_id' : doc_ids[i], 'dist' : dists[i], 'source' : sources[i]} for i in range(len(doc_ids))]
101+
result = [{'doc_id' : doc_ids[i], 'dist' : dists[i], 'source' : sources[doc_ids[i]]} for i in range(len(doc_ids))]
103102
else:
104103
result = []
105104

0 commit comments

Comments
 (0)