Skip to content

Commit

Permalink
Merge pull request #15 from tosemml/patch-1
Browse files (browse the repository at this point in the history)
Code refactoring
  • Loading branch information
shibing624 authored Sep 4, 2023
2 parents c17bff9 + b16d5d4 commit 6edb3c6
Showing 1 changed file with 2 additions and 5 deletions.
7 changes: 2 additions & 5 deletions similarities/utils/rank_bm25.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -4,6 +4,7 @@

import math
from multiprocessing import Pool, cpu_count
+ from collections import Counter

import numpy as np

Expand Down Expand Up @@ -36,11 +37,7 @@ def _initialize(self, corpus):
self.doc_len.append(len(document))
num_doc += len(document)

- frequencies = {}
- for word in document:
-     if word not in frequencies:
-         frequencies[word] = 0
-     frequencies[word] += 1
+ frequencies = dict(Counter(document))
self.doc_freqs.append(frequencies)

for word, freq in frequencies.items():
Expand Down

0 comments on commit 6edb3c6

Please sign in to comment.