Skip to content

Commit

Permalink
Use Counter
Browse files Browse the repository at this point in the history
  • Loading branch information
tosemml authored Sep 1, 2023
1 parent c17bff9 commit b16d5d4
Showing 1 changed file with 2 additions and 5 deletions.
7 changes: 2 additions & 5 deletions similarities/utils/rank_bm25.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@

import math
from multiprocessing import Pool, cpu_count
+ from collections import Counter

import numpy as np

Expand Down Expand Up @@ -36,11 +37,7 @@ def _initialize(self, corpus):
self.doc_len.append(len(document))
num_doc += len(document)

- frequencies = {}
- for word in document:
-     if word not in frequencies:
-         frequencies[word] = 0
-     frequencies[word] += 1
+ frequencies = dict(Counter(document))
self.doc_freqs.append(frequencies)

for word, freq in frequencies.items():
Expand Down

0 comments on commit b16d5d4

Please sign in to comment.