-
Notifications
You must be signed in to change notification settings - Fork 8.3k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge remote-tracking branch 'upstream/main' into 164059-untracked-disabled-alerts
- Loading branch information
Showing
43 changed files
with
1,336 additions
and
1,330 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,4 @@ | ||
# @kbn/ml-chi2test | ||
|
||
`computeChi2PValue` computes the p-value of a chi-squared test that compares the term distributions of two datasets. | ||
The returned value ranges from 0 to 1, with 1 meaning the datasets are identical. |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,48 @@ | ||
/* | ||
* Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one | ||
* or more contributor license agreements. Licensed under the Elastic License | ||
* 2.0; you may not use this file except in compliance with the Elastic License | ||
* 2.0. | ||
*/ | ||
|
||
import { criticalTableLookup } from './critical_table_lookup'; | ||
import type { Histogram } from './types'; | ||
|
||
/**
 * Computes the p-value of a chi-squared test that compares a drifted term
 * distribution against a baseline term distribution.
 *
 * The returned value ranges from 0 to 1, with 1 meaning the datasets are identical.
 *
 * Terms are matched by the string form of their `key`, so a non-string key
 * (e.g. a number) and its string spelling are treated as the same term. Only
 * the first 100 unique keys (baseline keys first, then drifted keys, in input
 * order) take part in the computation. A term that is missing on one side, or
 * that has no `percentage`, contributes a percentage of 0 for that side.
 *
 * @param normalizedBaselineTerms - Baseline terms; each `percentage` is the expected value.
 * @param normalizedDriftedTerms - Drifted terms; each `percentage` is the observed value.
 * @returns The value `criticalTableLookup` yields for the chi-squared statistic, or 1
 * when there is at most one unique key (nothing to compare).
 */
export const computeChi2PValue = (
  normalizedBaselineTerms: Histogram[],
  normalizedDriftedTerms: Histogram[]
) => {
  // Index one side by stringified key. When a key occurs more than once the
  // first occurrence wins, which is what a linear `find` would have returned.
  const indexByKey = (terms: Histogram[]) => {
    const percentageByKey = new Map<string, number>();
    for (const term of terms) {
      const key = term.key.toString();
      if (!percentageByKey.has(key)) {
        percentageByKey.set(key, term.percentage ?? 0);
      }
    }
    return percentageByKey;
  };

  const baseline = indexByKey(normalizedBaselineTerms);
  const drifted = indexByKey(normalizedDriftedTerms);

  // Unique keys across both sides, capped at the first 100.
  const allKeys = Array.from(new Set([...baseline.keys(), ...drifted.keys()])).slice(0, 100);

  const degreesOfFreedom = allKeys.length - 1;

  // Zero or one category: there is no distribution to compare (this also keeps a
  // negative degrees-of-freedom value from reaching the lookup on empty input).
  if (degreesOfFreedom <= 0) return 1;

  let chiSquared = 0;
  for (const key of allKeys) {
    const observed = drifted.get(key) ?? 0;
    const expected = baseline.get(key) ?? 0;
    // Prevent divide by zero: a non-positive expected value is replaced by 1e-6.
    chiSquared += (observed - expected) ** 2 / (expected > 0 ? expected : 1e-6);
  }

  // Use the criticalTableLookup function to determine the p-value
  return criticalTableLookup(chiSquared, degreesOfFreedom);
};
Oops, something went wrong.