rapidsai · JohnZed · Nov 2, 2020 · Oct 23, 2020 · Oct 23, 2020 · Oct 26, 2020
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -11,6 +11,7 @@
 - PR #2906: Moving `linalg` decomp to RAFT namespaces
 - PR #2996: Removing the max_depth restriction for switching to the batched backend
 - PR #3004: Remove Single Process Multi GPU (SPMG) code
+- PR #3052: Speeding up MNMG KNN Classifier & Regressor testing
 
 ## Bug Fixes
 - PR #2983: Fix seeding of KISS99 RNG

@@ -69,11 +69,11 @@ def dataset(request):
         if len(new_x) >= request.param['n_samples']:
             break
     X = X[new_x]
-    noise = np.random.normal(0, 1.2, X.shape)
+    noise = np.random.normal(0, 5., X.shape)
     X += noise
     y = np.array(new_y)
 
-    return train_test_split(X, y, test_size=0.1)
+    return train_test_split(X, y, test_size=0.3)
 
 
 def exact_match(output1, output2):
@@ -108,9 +108,9 @@ def check_probabilities(l_probas, d_probas):
 
 
 @pytest.mark.parametrize("datatype", ['dask_array', 'dask_cudf'])
-@pytest.mark.parametrize("n_neighbors", [1, 3, 8])
-@pytest.mark.parametrize("n_parts", [2, 4, 12])
-@pytest.mark.parametrize("batch_size", [128, 1024])
+@pytest.mark.parametrize("n_neighbors", [8])
+@pytest.mark.parametrize("n_parts", [2, 3, 8])
+@pytest.mark.parametrize("batch_size", [256])
 def test_predict_and_score(dataset, datatype, n_neighbors,
                            n_parts, batch_size, client):
     X_train, X_test, y_train, y_test = dataset
@@ -165,9 +165,9 @@ def test_predict_and_score(dataset, datatype, n_neighbors,
 
 
 @pytest.mark.parametrize("datatype", ['dask_array', 'dask_cudf'])
-@pytest.mark.parametrize("n_neighbors", [1, 3, 8])
-@pytest.mark.parametrize("n_parts", [2, 4, 12])
-@pytest.mark.parametrize("batch_size", [128, 1024])
+@pytest.mark.parametrize("n_neighbors", [8])
+@pytest.mark.parametrize("n_parts", [2, 3, 8])
+@pytest.mark.parametrize("batch_size", [256])
 def test_predict_proba(dataset, datatype, n_neighbors,
                        n_parts, batch_size, client):
     X_train, X_test, y_train, y_test = dataset

@@ -70,11 +70,11 @@ def dataset(request):
         if len(new_x) >= request.param['n_samples']:
             break
     X = X[new_x]
-    noise = np.random.normal(0, 1.2, X.shape)
+    noise = np.random.normal(0, 5., X.shape)
     X += noise
     y = np.array(new_y, dtype=np.float32)
 
-    return train_test_split(X, y, test_size=0.1)
+    return train_test_split(X, y, test_size=0.3)
 
 
 def exact_match(output1, output2):
@@ -102,9 +102,9 @@ def exact_match(output1, output2):
 
 
 @pytest.mark.parametrize("datatype", ['dask_array', 'dask_cudf'])
-@pytest.mark.parametrize("n_neighbors", [1, 3, 8])
-@pytest.mark.parametrize("n_parts", [2, 4, 12])
-@pytest.mark.parametrize("batch_size", [128, 1024])
+@pytest.mark.parametrize("n_neighbors", [8])
+@pytest.mark.parametrize("n_parts", [2, 3, 8])
+@pytest.mark.parametrize("batch_size", [256])
 def test_predict_and_score(dataset, datatype, n_neighbors,
                            n_parts, batch_size, client):
     X_train, X_test, y_train, y_test = dataset