piskvorky · tmylk · Aug 11, 2016 · Jul 25, 2016 · Aug 10, 2016 · Aug 10, 2016
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -11,6 +11,7 @@ Changes
 * Implemented LsiModel.docs_processed attribute
 * Added LdaMallet support. Added LdaVowpalWabbit, LdaMallet example to notebook. Added test suite for coherencemodel and aggregation.
   Added `topics` parameter to coherencemodel. Can now provide tokenized topics to calculate coherence value (@dsquareindia, #750)
+ * Added a check for empty (no words) documents before running the DTM wrapper when model = "fixed" is used (the DIM model), as such documents cause an error when they are reached in training. (@eickho, #806)
 
 0.13.1, 2016-06-22
 

diff --git a/gensim/models/wrappers/dtmmodel.py b/gensim/models/wrappers/dtmmodel.py
@@ -93,6 +93,9 @@ def __init__(
             lencorpus = sum(1 for _ in corpus)
         if lencorpus == 0:
             raise ValueError("cannot compute DTM over an empty corpus")
+        if model == "fixed" and any([i == 0 for i in [len(text) for text in corpus.get_texts()]]):
+            raise ValueError("""There is a text without words in the input corpus.
+                    This breaks method='fixed' (The DIM model).""")
         if lencorpus != sum(time_slices):
             raise ValueError("mismatched timeslices %{slices} for corpus of len {clen}".format(
                 slices=sum(time_slices), clen=lencorpus))