facebookresearch · mojtaba-komeili · Jul 23, 2021 · May 25, 2021 · Jul 22, 2021 · Jul 23, 2021
diff --git a/parlai/crowdsourcing/utils/acceptability.py b/parlai/crowdsourcing/utils/acceptability.py
@@ -10,6 +10,9 @@
 from parlai.utils.safety import OffensiveStringMatcher
 
 
+DEFAULT_MIN_WORDS_THRESHOLD = 3  # default minimum average words per message
+
+
 class AcceptabilityChecker:
 
     ALL_VIOLATION_TYPES = [
@@ -20,8 +23,9 @@ class AcceptabilityChecker:
         'safety',
     ]
 
-    def __init__(self):
+    def __init__(self, min_words=DEFAULT_MIN_WORDS_THRESHOLD):
         self.offensive_lang_detector = OffensiveStringMatcher()
+        self.min_words_violation_threshold = min_words  # min avg words/message
 
     def check_messages(
         self,
@@ -57,7 +61,7 @@ def check_messages(
         # Do messages have the minimum acceptable average number of words?
         if 'min_words' in violation_types:
             total_num_words = sum([len(message.split()) for message in messages])
-            if total_num_words / len(messages) < 3:
+            if total_num_words / len(messages) < self.min_words_violation_threshold:
                 violations.append('under_min_length')
 
         # Does the first message start with a greeting, indicating that the Turker