capitalone · taylorfturner · Nov 8, 2022 · Nov 4, 2022 · Nov 4, 2022 · Nov 4, 2022
@@ -2240,7 +2240,20 @@ def _update_null_replication_metrics(self, clean_samples: Dict) -> None:
         :param clean_samples: input cleaned dataset
         :type clean_samples: dict
         """
-        data = pd.DataFrame(clean_samples).apply(pd.to_numeric, errors="coerce")
+        data = pd.DataFrame(clean_samples)
+
+        # If trailing all-null rows are absent from data, add a row at max_null_index
+        max_null_index = max(
+            [max(i) for i in getattr(self._profile[0], "null_types_index").values()],
+            default=0,
+        )
+        if max_null_index > data.index.max():
+            data.loc[max_null_index] = {}
+
+        # Fill in missing rows with NaN and convert types to numeric
+        data = data.reindex(range(data.index.max() + 1), fill_value=np.nan).apply(
+            pd.to_numeric, errors="coerce"
+        )
 
         get_data_type = lambda profile: profile.profiles[  # NOQA: E731
             "data_type_profile"

@@ -2081,6 +2081,21 @@ def test_null_replication_metrics_calculation(self):
         np.testing.assert_array_almost_equal([[np.nan], [18]], column["class_sum"])
         np.testing.assert_array_almost_equal([[np.nan], [9]], column["class_mean"])
 
+        # Test with all null in a row
+        data_4 = pd.DataFrame(
+            [[10, 20], [9999999, 9999999], [30, 9999999], [9999999, 9999999]]
+        )
+
+        profiler = dp.StructuredProfiler(data_4, options=profile_options)
+        report = profiler.report()
+
+        self.assertTrue("null_replication_metrics" in report["data_stats"][0])
+        column = report["data_stats"][0]["null_replication_metrics"]
+
+        np.testing.assert_array_almost_equal([0.5, 0.5], column["class_prior"])
+        np.testing.assert_array_almost_equal([[20], [0]], column["class_sum"])
+        np.testing.assert_array_almost_equal([[10], [0]], column["class_mean"])
+
     def test_column_level_invalid_values(self):
         data = pd.DataFrame([[1, 1], [9999999, 2], [3, 3]])