hrs · prabhav-pandya · Nov 8, 2020 · Nov 8, 2020 · Nov 8, 2020 · Nov 8, 2020
diff --git a/.idea/.gitignore b/.idea/.gitignore
diff --git a/.idea/inspectionProfiles/profiles_settings.xml b/.idea/inspectionProfiles/profiles_settings.xml
diff --git a/.idea/misc.xml b/.idea/misc.xml
diff --git a/.idea/modules.xml b/.idea/modules.xml
diff --git a/.idea/python-tf-idf.iml b/.idea/python-tf-idf.iml
diff --git a/.idea/vcs.xml b/.idea/vcs.xml
diff --git a/README.md b/README.md
@@ -29,6 +29,10 @@ table.add_document("baz", ["kilo", "lima", "mike", "november"])
 
 print table.similarities(["alpha", "bravo", "charlie"]) # => [['foo', 0.6875], ['bar', 0.75], ['baz', 0.0]]
 ```
+To show only the top n results, sorted from highest to lowest score, pass `top_n`:
+```python
+print table.similarities(["alpha", "bravo", "charlie"], top_n = 2) # => [['bar', 0.75], ['foo', 0.6875]]
+```
 
 ### Run the tests
 

diff --git a/test_tfidf.py b/test_tfidf.py
@@ -10,9 +10,9 @@ def test_similarity(self):
         table.add_document("baz", ["k", "l", "m", "n"])
 
         self.assertEqual(
-            table.similarities(["a", "b", "c"]),
-            [["foo", 0.6875], ["bar", 0.75], ["baz", 0.0]])
+            table.similarities(["a", "b", "c"],2),
+            [["bar", 0.75],["foo", 0.6875]])
 
 
 if __name__ == "__main__":
-    unittest.main()
+    unittest.main()
diff --git a/tfidf.py b/tfidf.py
@@ -36,12 +36,12 @@ def add_document(self, doc_name, list_of_words):
         # add the normalized document to the corpus
         self.documents.append([doc_name, doc_dict])
 
-    def similarities(self, list_of_words):
-        """Returns a list of all the [docname, similarity_score] pairs relative to a
-list of words.
-
+    def similarities(self, list_of_words, top_n=-1):
+        """
+        Returns a list of all the [docname, similarity_score] pairs relative to a
+        list of words.
+        Set top_n to a positive integer to return only the top_n highest-scoring pairs, sorted by descending score; otherwise all pairs are returned.
         """
-
         # building the query dictionary
         query_dict = {}
         for w in list_of_words:
@@ -63,4 +63,17 @@ def similarities(self, list_of_words):
                       doc_dict[k] / self.corpus_dict[k])
             sims.append([doc[0], score])
 
+        # sorting and returning the top n results
+        if top_n > 0:
+            sims.sort(key=self.__get_score, reverse=True)
+            return sims[:top_n]
+
         return sims
+
+    def __get_score(self, sim_obj):
+        """
+        Return the similarity_score from a [docname, similarity_score] pair.
+        Private helper used as the sort key when top_n results are requested.
+        """
+        return sim_obj[1]
+