Skip to content

Commit

Permalink
add direct metrics pushed to datadog
Browse files Browse the repository at this point in the history
  • Loading branch information
Mefl committed Dec 24, 2024
1 parent f8fa855 commit f54d6cb
Show file tree
Hide file tree
Showing 8 changed files with 218 additions and 10 deletions.
15 changes: 15 additions & 0 deletions api/index.js
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,8 @@ import { validateEnvironmentVariables } from './src/shared/infrastructure/valida

validateEnvironmentVariables();

import metrics from 'datadog-metrics';

import { disconnect, prepareDatabaseConnection } from './db/knex-database-connection.js';
import { createServer } from './server.js';
import { config } from './src/shared/config.js';
Expand Down Expand Up @@ -35,6 +37,19 @@ async function _exitOnSignal(signal) {
logger.info(`Received signal: ${signal}.`);
logger.info('Stopping HAPI server...');
await server.stop({ timeout: 30000 });
if (server.pixCustomIntervals) {
metrics.gauge('captain.api.conteneur', 0);
metrics.gauge(`captain.api.memory.rss`, 0);
metrics.gauge('captain.api.memory.heapTotal', 0);
metrics.gauge('captain.api.memory.heapUsed', 0);
metrics.gauge('captain.api.knex.db_connections_used', 0);
metrics.gauge('captain.api.knex.db_connections_free', 0);
metrics.gauge('captain.api.knex.db_connections_pending_creation', 0);
metrics.gauge('captain.api.knex.db_connections_pending_destroy', 0);
logger.info('Closing metrics interval and flush metrics');
server.pixCustomIntervals.forEach(clearInterval);
metrics.flush();
}
if (server.oppsy) {
logger.info('Stopping HAPI Oppsy server...');
await server.oppsy.stop();
Expand Down
104 changes: 104 additions & 0 deletions api/package-lock.json

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

1 change: 1 addition & 0 deletions api/package.json
Original file line number Diff line number Diff line change
Expand Up @@ -39,6 +39,7 @@
"cron-parser": "^4.9.0",
"dataloader": "^2.2.2",
"dayjs": "^1.11.5",
"datadog-metrics": "^0.12.0",
"debug": "^4.3.4",
"dotenv": "^16.0.1",
"fast-levenshtein": "^3.0.0",
Expand Down
8 changes: 8 additions & 0 deletions api/sample.env
Original file line number Diff line number Diff line change
Expand Up @@ -49,6 +49,14 @@ REDIS_URL=redis://localhost:6379
# default: none
# CACHE_RELOAD_CONTAINER_SIZE=M

# =====
# DATADOG
# =====

# Datadog access context
#
DATADOG_API_KEY=nokey

# =========
# DATABASES
# =========
Expand Down
65 changes: 64 additions & 1 deletion api/server.js
Original file line number Diff line number Diff line change
@@ -1,5 +1,6 @@
import Oppsy from '@1024pix/oppsy';
import Hapi from '@hapi/hapi';
import metrics from 'datadog-metrics';
import { parse } from 'neoqs';

import { setupErrorHandling } from './config/server-setup-error-handling.js';
Expand Down Expand Up @@ -36,6 +37,7 @@ import { config } from './src/shared/config.js';
import { monitoringTools } from './src/shared/infrastructure/monitoring-tools.js';
import { plugins } from './src/shared/infrastructure/plugins/index.js';
import { deserializer } from './src/shared/infrastructure/serializers/jsonapi/deserializer.js';
import { logger } from './src/shared/infrastructure/utils/logger.js';
// bounded context migration
import { sharedRoutes } from './src/shared/routes.js';
import { swaggers } from './src/shared/swaggers.js';
Expand Down Expand Up @@ -70,7 +72,26 @@ const { logOpsMetrics, port, logging } = config;
const createServer = async () => {
const server = createBareServer();

if (logOpsMetrics) await enableOpsMetrics(server);
// initialisation of Datadog link for metrics publication
if (config.environment !== 'development' || config.featureToggles.isDirectMetricsEnabled) {
logger.info('Metric initialisation : linked to Datadog');
metrics.init({
host: config.infra.containerName,
prefix: '',
flushIntervalSeconds: config.infra.metricsFlushIntervalSecond,
defaultTags: [`service:${config.infra.appName}`],
});
} else {
logger.info('Metric initialisation : no reporter => no metrics sent');
metrics.init({ reporter: metrics.NullReporter() });
}

if (logOpsMetrics) {
// OPS metrics via direct metrics
if (config.featureToggles.isDirectMetricsEnabled) await enableOpsMetrics(server);
// OPS metrics via Oppsy
if (!config.featureToggles.isOppsyDisabled) await enableLegacyOpsMetrics(server);
}

setupErrorHandling(server);

Expand Down Expand Up @@ -126,6 +147,48 @@ const createBareServer = function () {
};

const enableOpsMetrics = async function (server) {
function collectMemoryStats() {
const memUsage = process.memoryUsage();
metrics.gauge(`captain.api.memory.rss`, memUsage.rss);
metrics.gauge('captain.api.memory.heapTotal', memUsage.heapTotal);
metrics.gauge('captain.api.memory.heapUsed', memUsage.heapUsed);
metrics.gauge('captain.api.conteneur', 1);
}

const metricsInterval = setInterval(collectMemoryStats, 5000);
server.pixCustomIntervals = [metricsInterval];

const gaugeConnections = (pool) => () => {
logger.info('publie les metrics de knex');
metrics.gauge('captain.api.knex.db_connections_used', pool.numUsed());
metrics.gauge('captain.api.knex.db_connections_free', pool.numFree());
metrics.gauge('captain.api.knex.db_connections_pending_creation', pool.numPendingCreates());
metrics.gauge('captain.api.knex.db_connections_pending_destroy', pool['pendingDestroys'].length);
};

const client = knex.client;
gaugeConnections(client.pool)();

client.pool.on('createSuccess', gaugeConnections(client.pool));
client.pool.on('acquireSuccess', gaugeConnections(client.pool));
client.pool.on('release', gaugeConnections(client.pool));
client.pool.on('destroySuccess', gaugeConnections(client.pool));

server.events.on('response', (request) => {
const info = request.info;

const statusCode = request.raw.res.statusCode;
const responseTime = (info.completed !== undefined ? info.completed : info.responded) - info.received;

metrics.histogram('captain.api.duration', responseTime, [
`method:${request.route.method}`,
`route:${request.route.path}`,
`statusCode:${statusCode}`,
]);
});
};

const enableLegacyOpsMetrics = async function (server) {
const oppsy = new Oppsy(server);

oppsy.on('ops', (data) => {
Expand Down
10 changes: 10 additions & 0 deletions api/src/shared/config.js
Original file line number Diff line number Diff line change
Expand Up @@ -251,9 +251,11 @@ const configuration = (function () {
process.env.FT_ALWAYS_OK_VALIDATE_NEXT_CHALLENGE_ENDPOINT,
),
isAsyncQuestRewardingCalculationEnabled: toBoolean(process.env.FT_ENABLE_ASYNC_QUESTS_REWARDS_CALCULATION),
isDirectMetricsEnabled: toBoolean(process.env.FT_ENABLE_DIRECT_METRICS),
isNeedToAdjustCertificationAccessibilityEnabled: toBoolean(
process.env.FT_ENABLE_NEED_TO_ADJUST_CERTIFICATION_ACCESSIBILITY,
),
isOppsyDisabled: toBoolean(process.env.FT_OPPSY_DISABLED),
isPix1dEnabled: toBoolean(process.env.FT_PIX_1D_ENABLED),
isPixCompanionEnabled: toBoolean(process.env.FT_PIX_COMPANION_ENABLED),
isSelfAccountDeletionEnabled: toBoolean(process.env.FT_SELF_ACCOUNT_DELETION),
Expand All @@ -270,12 +272,15 @@ const configuration = (function () {
enableRequestMonitoring: toBoolean(process.env.ENABLE_REQUEST_MONITORING),
},
infra: {
appName: process.env.APP,
containerName: process.env.CONTAINER,
concurrencyForHeavyOperations: _getNumber(process.env.INFRA_CONCURRENCY_HEAVY_OPERATIONS, 2),
chunkSizeForCampaignResultProcessing: _getNumber(process.env.INFRA_CHUNK_SIZE_CAMPAIGN_RESULT_PROCESSING, 10),
chunkSizeForOrganizationLearnerDataProcessing: _getNumber(
process.env.INFRA_CHUNK_SIZE_ORGANIZATION_LEARNER_DATA_PROCESSING,
1000,
),
metricsFlushIntervalSecond: _getNumber(process.env.METRICS_FLUSH_INTERVAL_SECOND, 15),
startJobInWebProcess: toBoolean(process.env.START_JOB_IN_WEB_PROCESS),
},
jwtConfig: {
Expand Down Expand Up @@ -344,6 +349,9 @@ const configuration = (function () {
},
},
},
metrics: {
flushIntervalSeconds: _getNumber(process.env.DIRECT_METRICS_FLUSH_INTERVAL, 5),
},
partner: {
fetchTimeOut: ms(process.env.FETCH_TIMEOUT_MILLISECONDS || '20s'),
},
Expand Down Expand Up @@ -478,7 +486,9 @@ const configuration = (function () {

config.featureToggles.deprecatePoleEmploiPushNotification = false;
config.featureToggles.isAlwaysOkValidateNextChallengeEndpointEnabled = false;
config.featureToggles.isDirectMetricsEnabled = false;
config.featureToggles.isNeedToAdjustCertificationAccessibilityEnabled = false;
config.featureToggles.isOppsyDisabled = false;
config.featureToggles.isPix1dEnabled = true;
config.featureToggles.isPixCompanionEnabled = false;
config.featureToggles.isSelfAccountDeletionEnabled = false;
Expand Down
Loading

0 comments on commit f54d6cb

Please sign in to comment.