Skip to content

Commit

Permalink
[APM] Check if metric fields exist (#145348)
Browse files Browse the repository at this point in the history
Fixes the following error:
```
"script_stack": [
            "[email protected]/org.elasticsearch.index.fielddata.ScriptDocValues.throwIfEmpty(ScriptDocValues.java:92)",
            "[email protected]/org.elasticsearch.index.fielddata.ScriptDocValues$Longs.get(ScriptDocValues.java:110)",
            "[email protected]/org.elasticsearch.index.fielddata.ScriptDocValues$Longs.getValue(ScriptDocValues.java:105)",
            """total = useCgroupLimit ? doc[limitKey].value : doc['system.memory.total'].value;

    double """,
            "                                                                         ^---- HERE"


```

connected elastic/sdh-apm#765 (internal)

---------

Co-authored-by: kibanamachine <[email protected]>
Co-authored-by: Søren Louv-Jansen <[email protected]>
  • Loading branch information
3 people authored Apr 27, 2023
1 parent 61c82dc commit 98165d2
Show file tree
Hide file tree
Showing 8 changed files with 263 additions and 35 deletions.
2 changes: 2 additions & 0 deletions packages/kbn-apm-synthtrace-client/src/lib/apm/apm_fields.ts
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,8 @@ export type ApmApplicationMetricFields = Partial<{
'system.process.memory.size': number;
'system.memory.actual.free': number;
'system.memory.total': number;
'system.process.cgroup.memory.mem.limit.bytes': number;
'system.process.cgroup.memory.mem.usage.bytes': number;
'system.cpu.total.norm.pct': number;
'system.process.memory.rss.bytes': number;
'system.process.cpu.total.norm.pct': number;
Expand Down

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

Original file line number Diff line number Diff line change
Expand Up @@ -47,6 +47,15 @@ const chartBase: ChartBase = {
series,
};

/**
 * Elasticsearch `bool` filter that only matches documents in which BOTH
 * system memory fields (free and total) are present.
 *
 * NOTE(review): presumably these are the fields read by
 * `percentSystemMemoryUsedScript`, so the filter keeps the script from
 * running on documents that lack them — confirm against the script source.
 */
export const systemMemoryFilter = {
bool: {
// Every clause under `filter` must match.
filter: [
{ exists: { field: METRIC_SYSTEM_FREE_MEMORY } },
{ exists: { field: METRIC_SYSTEM_TOTAL_MEMORY } },
],
},
};

export const percentSystemMemoryUsedScript = {
lang: 'painless',
source: `
Expand All @@ -60,6 +69,17 @@ export const percentSystemMemoryUsedScript = {
`,
} as const;

/**
 * Elasticsearch `bool` filter for cgroup memory documents.
 *
 * A document matches when the cgroup memory usage field exists AND at least
 * one of the two fields usable as the "total" exists: the cgroup memory limit
 * or the system total memory.
 *
 * NOTE(review): presumably mirrors `percentCgroupMemoryUsedScript`, which
 * appears to read either the cgroup limit or the system total — confirm
 * against the script source.
 */
export const cgroupMemoryFilter = {
bool: {
// Required: the usage field must be present.
filter: [{ exists: { field: METRIC_CGROUP_MEMORY_USAGE_BYTES } }],
// Alternatives: either the cgroup limit or the system total must be present.
should: [
{ exists: { field: METRIC_CGROUP_MEMORY_LIMIT_BYTES } },
{ exists: { field: METRIC_SYSTEM_TOTAL_MEMORY } },
],
// Without this, `should` clauses next to a `filter` clause would be optional.
minimum_should_match: 1,
},
};

export const percentCgroupMemoryUsedScript = {
lang: 'painless',
source: `
Expand Down Expand Up @@ -147,7 +167,7 @@ export async function getMemoryChartData({
memoryUsedMax: { max: { script: percentCgroupMemoryUsedScript } },
},
additionalFilters: [
{ exists: { field: METRIC_CGROUP_MEMORY_USAGE_BYTES } },
cgroupMemoryFilter,
...termQuery(FAAS_ID, serverlessId),
],
operationName: 'get_cgroup_memory_metrics_charts',
Expand All @@ -169,8 +189,7 @@ export async function getMemoryChartData({
memoryUsedMax: { max: { script: percentSystemMemoryUsedScript } },
},
additionalFilters: [
{ exists: { field: METRIC_SYSTEM_FREE_MEMORY } },
{ exists: { field: METRIC_SYSTEM_TOTAL_MEMORY } },
systemMemoryFilter,
...termQuery(FAAS_ID, serverlessId),
],
operationName: 'get_system_memory_metrics_charts',
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -9,10 +9,7 @@ import type { ESFilter } from '@kbn/es-types';
import { rangeQuery } from '@kbn/observability-plugin/server';
import { ProcessorEvent } from '@kbn/observability-plugin/common';
import {
METRIC_CGROUP_MEMORY_USAGE_BYTES,
METRIC_SYSTEM_CPU_PERCENT,
METRIC_SYSTEM_FREE_MEMORY,
METRIC_SYSTEM_TOTAL_MEMORY,
SERVICE_NAME,
TRANSACTION_TYPE,
} from '../../../common/es_fields/apm';
Expand All @@ -31,6 +28,8 @@ import { withApmSpan } from '../../utils/with_apm_span';
import {
percentCgroupMemoryUsedScript,
percentSystemMemoryUsedScript,
systemMemoryFilter,
cgroupMemoryFilter,
} from '../metrics/by_agent/shared/memory';
import { APMEventClient } from '../../lib/helpers/create_es_client/create_apm_event_client';
import { ApmDocumentType } from '../../../common/document_type';
Expand Down Expand Up @@ -358,19 +357,14 @@ function getMemoryStats({
};

let memoryUsage = await getMemoryUsage({
additionalFilters: [
{ exists: { field: METRIC_CGROUP_MEMORY_USAGE_BYTES } },
],
script: percentCgroupMemoryUsedScript,
additionalFilters: [cgroupMemoryFilter],
});

if (!memoryUsage) {
memoryUsage = await getMemoryUsage({
additionalFilters: [
{ exists: { field: METRIC_SYSTEM_FREE_MEMORY } },
{ exists: { field: METRIC_SYSTEM_TOTAL_MEMORY } },
],
script: percentSystemMemoryUsedScript,
additionalFilters: [systemMemoryFilter],
});
}

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -9,10 +9,7 @@ import type { AggregationOptionsByType } from '@kbn/es-types';
import { kqlQuery, rangeQuery } from '@kbn/observability-plugin/server';
import { ProcessorEvent } from '@kbn/observability-plugin/common';
import {
METRIC_CGROUP_MEMORY_USAGE_BYTES,
METRIC_PROCESS_CPU_PERCENT,
METRIC_SYSTEM_FREE_MEMORY,
METRIC_SYSTEM_TOTAL_MEMORY,
SERVICE_NAME,
SERVICE_NODE_NAME,
} from '../../../../common/es_fields/apm';
Expand All @@ -24,6 +21,8 @@ import { APMEventClient } from '../../../lib/helpers/create_es_client/create_apm
import {
percentCgroupMemoryUsedScript,
percentSystemMemoryUsedScript,
systemMemoryFilter,
cgroupMemoryFilter,
} from '../../metrics/by_agent/shared/memory';
import { getOffsetInMs } from '../../../../common/utils/get_offset_in_ms';

Expand Down Expand Up @@ -82,19 +81,6 @@ export async function getServiceInstancesSystemMetricStatistics<
numBuckets,
});

const systemMemoryFilter = {
bool: {
filter: [
{ exists: { field: METRIC_SYSTEM_FREE_MEMORY } },
{ exists: { field: METRIC_SYSTEM_TOTAL_MEMORY } },
],
},
};

const cgroupMemoryFilter = {
exists: { field: METRIC_CGROUP_MEMORY_USAGE_BYTES },
};

const cpuUsageFilter = { exists: { field: METRIC_PROCESS_CPU_PERCENT } };

function withTimeseries<TParams extends AggregationOptionsByType['avg']>(
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,77 @@
/*
* Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
* or more contributor license agreements. Licensed under the Elastic License
* 2.0; you may not use this file except in compliance with the Elastic License
* 2.0.
*/
import { apm, timerange } from '@kbn/apm-synthtrace-client';
import type { ApmSynthtraceEsClient } from '@kbn/apm-synthtrace';

/** Converts a size in gigabytes (binary, 1024-based) to bytes. */
const gigabytesToBytes = (value: number): number => value * 1024 ** 3;

/**
 * Memory values (in bytes) written into the synthetic metric documents
 * produced by `generateData`.
 */
export const config = {
// System-wide memory figures.
memoryTotal: gigabytesToBytes(64),
memoryFree: gigabytesToBytes(5.5),
// Cgroup memory figures.
cGroupMemoryLimit: gigabytesToBytes(8),
cGroupMemoryUsage: gigabytesToBytes(1.5),
};

/**
 * Values derived from `config` for the system-memory case:
 * the number of used bytes (total minus free) and that amount as a
 * fraction of the total.
 */
export const expectedValues = (({ memoryTotal, memoryFree }) => {
  const expectedMemoryUsed = memoryTotal - memoryFree;

  return {
    expectedMemoryUsedRate: expectedMemoryUsed / memoryTotal,
    expectedMemoryUsed,
  };
})(config);

/**
 * Indexes synthetic application metrics for three Go services in the
 * `production` environment, one metric document per service per minute
 * between `start` and `end`:
 *
 * - `system-metric-only-service`: system free/total memory only.
 * - `cgroup-memory-only-service`: cgroup memory usage only.
 * - `cgroup-memory-with-limit-production`: cgroup usage and limit plus
 *   system free/total memory.
 *
 * @param synthtraceEsClient client used to index the generated events
 * @param start range start, passed to `timerange`
 * @param end range end, passed to `timerange`
 */
export async function generateData({
  synthtraceEsClient,
  start,
  end,
}: {
  synthtraceEsClient: ApmSynthtraceEsClient;
  start: number;
  end: number;
}) {
  // All services share the same environment and agent; only the names differ.
  const createGoInstance = (serviceName: string, instanceName: string) =>
    apm
      .service({ name: serviceName, environment: 'production', agentName: 'go' })
      .instance(instanceName);

  const systemOnly = createGoInstance(
    'system-metric-only-service',
    'system-metric-only-production'
  );
  const cgroupOnly = createGoInstance(
    'cgroup-memory-only-service',
    'cgroup-memory-only-production'
  );
  const cgroupWithLimit = createGoInstance(
    'cgroup-memory-with-limit-production',
    'cgroup-memory-with-limit-production'
  );

  const metricEvents = timerange(start, end)
    .ratePerMinute(1)
    .generator((timestamp) => {
      const systemOnlyMetrics = systemOnly
        .appMetrics({
          'system.memory.actual.free': config.memoryFree,
          'system.memory.total': config.memoryTotal,
        })
        .timestamp(timestamp);

      const cgroupOnlyMetrics = cgroupOnly
        .appMetrics({
          'system.process.cgroup.memory.mem.usage.bytes': config.cGroupMemoryUsage,
        })
        .timestamp(timestamp);

      const cgroupWithLimitMetrics = cgroupWithLimit
        .appMetrics({
          'system.process.cgroup.memory.mem.usage.bytes': config.cGroupMemoryUsage,
          'system.process.cgroup.memory.mem.limit.bytes': config.cGroupMemoryLimit,
          'system.memory.total': config.memoryTotal,
          'system.memory.actual.free': config.memoryFree,
        })
        .timestamp(timestamp);

      return [systemOnlyMetrics, cgroupOnlyMetrics, cgroupWithLimitMetrics];
    });

  await synthtraceEsClient.index(metricEvents);
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,83 @@
/*
* Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
* or more contributor license agreements. Licensed under the Elastic License
* 2.0; you may not use this file except in compliance with the Elastic License
* 2.0.
*/

import expect from '@kbn/expect';
import { FtrProviderContext } from '../../../common/ftr_provider_context';
import { config, generateData } from './generate_data';

/**
 * API integration tests for the memory usage chart returned by
 * `GET /internal/apm/services/{serviceName}/metrics/charts`.
 *
 * Covers three kinds of synthetic services (see `generateData`):
 * system memory only, cgroup memory with a limit, and cgroup memory usage
 * without any field that could serve as the total.
 */
export default function ApiTest({ getService }: FtrProviderContext) {
  const registry = getService('registry');
  const apmApiClient = getService('apmApiClient');
  const synthtraceEsClient = getService('synthtraceEsClient');

  const start = new Date('2023-01-01T00:00:00.000Z').getTime();
  const end = new Date('2023-01-01T00:15:00.000Z').getTime() - 1;

  // Titles of the chart series whose overall value is asserted.
  const seriesTitles = ['Max', 'Average'];

  /** Requests the metric charts of `serviceName` for the generated time range. */
  async function callMetricChartsAPI(serviceName: string) {
    return await apmApiClient.readUser({
      endpoint: `GET /internal/apm/services/{serviceName}/metrics/charts`,
      params: {
        path: { serviceName },
        query: {
          environment: 'production',
          start: new Date(start).toISOString(),
          end: new Date(end).toISOString(),
          kuery: '',
          agentName: 'go',
        },
      },
    });
  }

  registry.when('Memory', { config: 'trial', archives: [] }, () => {
    before(async () => {
      await generateData({ start, end, synthtraceEsClient });
    });

    after(() => synthtraceEsClient.clean());

    it('returns system memory stats', async () => {
      // Fraction of system memory in use: 1 - free / total.
      const expectedMemoryUsedRate = 1 - config.memoryFree / config.memoryTotal;

      const { status, body } = await callMetricChartsAPI('system-metric-only-service');
      // Assert the status first so a failed request is reported as such
      // instead of as an error while reading the body.
      expect(status).to.be(200);

      const memoryChart = body.charts.find(({ key }) => key === 'memory_usage_chart');
      for (const title of seriesTitles) {
        const series = memoryChart?.series.find((item) => item.title === title);
        expect(series?.overallValue).to.eql(expectedMemoryUsedRate);
      }
    });

    it('returns cgroup memory with system.process.cgroup.memory.mem.limit.bytes', async () => {
      // Fraction of the cgroup limit in use: usage / limit.
      const expectedMemoryUsedRate = config.cGroupMemoryUsage / config.cGroupMemoryLimit;

      const { status, body } = await callMetricChartsAPI('cgroup-memory-with-limit-production');
      expect(status).to.be(200);

      const memoryChart = body.charts.find(({ key }) => key === 'memory_usage_chart');
      for (const title of seriesTitles) {
        const series = memoryChart?.series.find((item) => item.title === title);
        expect(series?.overallValue).to.eql(expectedMemoryUsedRate);
      }
    });

    it('handles cgroup memory stats when system.process.cgroup.memory.mem.limit.bytes and system.memory.total are not present', async () => {
      // Must be the SERVICE name. The generated instance is called
      // 'cgroup-memory-only-production'; querying by that name targets a
      // service with no data at all, so the empty-series assertion would
      // pass without exercising the cgroup-only documents.
      const { status, body } = await callMetricChartsAPI('cgroup-memory-only-service');
      expect(status).to.be(200);

      const memoryChart = body.charts.find(({ key }) => key === 'memory_usage_chart');
      expect(memoryChart?.series).to.eql([]);
    });
  });
}
Loading

0 comments on commit 98165d2

Please sign in to comment.