Skip to content

Commit

Permalink
[CI] Archive logs from yarn es docker runs (#189231)
Browse files Browse the repository at this point in the history
## Summary
The problem we're trying to solve here is to get access to
`elasticsearch-serverless` logs when they're started in docker
containers in the background (and `elasticsearch`, although currently we
don't test against that in docker for now).
## Solution
In essence:
- we needed to remove the `--rm` flag, this would allow for the
containers to stay present after they're done.
- after this, we can run `docker logs ...` on FTR post-hooks, save
these, then archive these files to buildkite
- because the containers are not removed upon finishing, we need to
clean up dangling containers before starting up

Backporting is probably not necessary, because this is only applicable
for serverless - and serverless is only supposed to run on main.

Solves: #191505
(cherry picked from commit bce4a17)
  • Loading branch information
delanni committed Sep 16, 2024
1 parent 5f8e564 commit 3ad72b0
Show file tree
Hide file tree
Showing 6 changed files with 111 additions and 17 deletions.
1 change: 1 addition & 0 deletions .buildkite/scripts/lifecycle/post_command.sh
Original file line number Diff line number Diff line change
Expand Up @@ -35,6 +35,7 @@ if [[ "$IS_TEST_EXECUTION_STEP" == "true" ]]; then
buildkite-agent artifact upload 'x-pack/test/functional/failure_debug/html/*.html'
buildkite-agent artifact upload '.es/**/*.hprof'
buildkite-agent artifact upload 'data/es_debug_*.tar.gz'
buildkite-agent artifact upload '.es/es*.log'

if [[ $BUILDKITE_COMMAND_EXIT_STATUS -ne 0 ]]; then
if [[ $BUILDKITE_TRIGGERED_FROM_BUILD_PIPELINE_SLUG == 'elasticsearch-serverless-intake' ]]; then
Expand Down
6 changes: 4 additions & 2 deletions packages/kbn-es/src/utils/docker.test.ts
Original file line number Diff line number Diff line change
Expand Up @@ -665,12 +665,13 @@ describe('runServerlessCluster()', () => {

// docker version (1)
// docker ps (1)
// docker container rm (3)
// docker network create (1)
// docker pull (1)
// docker inspect (1)
// docker run (3)
// docker logs (1)
expect(execa.mock.calls).toHaveLength(9);
expect(execa.mock.calls).toHaveLength(12);
});

test(`should wait for serverless nodes to return 'green' status`, async () => {
Expand Down Expand Up @@ -806,11 +807,12 @@ describe('runDockerContainer()', () => {
await expect(runDockerContainer(log, {})).resolves.toBeUndefined();
// docker version (1)
// docker ps (1)
// docker container rm (3)
// docker network create (1)
// docker pull (1)
// docker inspect (1)
// docker run (1)
expect(execa.mock.calls).toHaveLength(6);
expect(execa.mock.calls).toHaveLength(9);
});
});

Expand Down
43 changes: 29 additions & 14 deletions packages/kbn-es/src/utils/docker.ts
Original file line number Diff line number Diff line change
Expand Up @@ -113,8 +113,6 @@ const DOCKER_REGISTRY = 'docker.elastic.co';
const DOCKER_BASE_CMD = [
'run',

'--rm',

'-t',

'--net',
Expand Down Expand Up @@ -151,8 +149,6 @@ export const ES_SERVERLESS_DEFAULT_IMAGE = `${ES_SERVERLESS_REPO_KIBANA}:${ES_SE
const SHARED_SERVERLESS_PARAMS = [
'run',

'--rm',

'--detach',

'--interactive',
Expand Down Expand Up @@ -391,7 +387,6 @@ const RETRYABLE_DOCKER_PULL_ERROR_MESSAGES = [
];

/**
*
* Pull a Docker image if needed. Ensures latest image.
* Stops serverless from pulling the same image in each node's promise and
* gives better control of log output, instead of falling back to docker run.
Expand Down Expand Up @@ -443,6 +438,24 @@ export async function printESImageInfo(log: ToolingLog, image: string) {
log.info(`Using ES image: ${imageFullName} (${revisionUrl})`);
}

export async function cleanUpDanglingContainers(log: ToolingLog) {
log.info(chalk.bold('Cleaning up dangling Docker containers.'));

try {
const serverlessContainerNames = SERVERLESS_NODES.map(({ name }) => name);

for (const name of serverlessContainerNames) {
await execa('docker', ['container', 'rm', name, '--force']).catch(() => {
// Ignore errors if the container doesn't exist
});
}

log.success('Cleaned up dangling Docker containers.');
} catch (e) {
log.error(e);
}
}

export async function detectRunningNodes(
log: ToolingLog,
options: ServerlessOptions | DockerOptions
Expand All @@ -454,19 +467,19 @@ export async function detectRunningNodes(
}, []);

const { stdout } = await execa('docker', ['ps', '--quiet'].concat(namesCmd));
const runningNodes = stdout.split(/\r?\n/).filter((s) => s);
const runningNodeIds = stdout.split(/\r?\n/).filter((s) => s);

if (runningNodes.length) {
if (runningNodeIds.length) {
if (options.kill) {
log.info(chalk.bold('Killing running ES Nodes.'));
await execa('docker', ['kill'].concat(runningNodes));

return;
await execa('docker', ['kill'].concat(runningNodeIds));
} else {
throw createCliError(
'ES has already been started, pass --kill to automatically stop the nodes on startup.'
);
}

throw createCliError(
'ES has already been started, pass --kill to automatically stop the nodes on startup.'
);
} else {
log.info('No running nodes detected.');
}
}

Expand All @@ -484,6 +497,7 @@ async function setupDocker({
}) {
await verifyDockerInstalled(log);
await detectRunningNodes(log, options);
await cleanUpDanglingContainers(log);
await maybeCreateDockerNetwork(log);
await maybePullDockerImage(log, image);
await printESImageInfo(log, image);
Expand Down Expand Up @@ -774,6 +788,7 @@ export async function runServerlessCluster(log: ToolingLog, options: ServerlessO
const volumeCmd = await setupServerlessVolumes(log, options);
const portCmd = resolvePort(options);

// This is where nodes are started
const nodeNames = await Promise.all(
SERVERLESS_NODES.map(async (node, i) => {
await runServerlessEsNode(log, {
Expand Down
73 changes: 73 additions & 0 deletions packages/kbn-es/src/utils/extract_and_archive_logs.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,73 @@
/*
* Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
* or more contributor license agreements. Licensed under the "Elastic License
* 2.0", the "GNU Affero General Public License v3.0 only", and the "Server Side
* Public License v 1"; you may not use this file except in compliance with, at
* your election, the "Elastic License 2.0", the "GNU Affero General Public
* License v3.0 only", or the "Server Side Public License, v 1".
*/

import type { ToolingLog } from '@kbn/tooling-log';

import execa from 'execa';
import Fsp from 'fs/promises';
import { join } from 'path';

import { REPO_ROOT } from '@kbn/repo-info';

/**
* Extracts logs from Docker nodes, writes them to files, and returns the file paths.
*/
export async function extractAndArchiveLogs({
outputFolder,
log,
nodeNames,
}: {
log: ToolingLog;
nodeNames?: string[];
outputFolder?: string;
}) {
outputFolder = outputFolder || join(REPO_ROOT, '.es');
const logFiles: string[] = [];

if (!nodeNames) {
const { stdout: nodeNamesString } = await execa('docker', [
'ps',
'-a',
'--format',
'{{.Names}}',
]);
nodeNames = nodeNamesString.split('\n').filter(Boolean);
}

if (!nodeNames.length) {
log.info('No Docker nodes found to extract logs from');
return;
} else {
log.info(`Attempting to extract logs from Docker nodes to ${outputFolder}`);
}

for (const name of nodeNames) {
const { stdout: nodeId } = await execa('docker', [
'ps',
'-a',
'--quiet',
'--filter',
`name=${name}`,
]);
if (!nodeId) {
continue;
}

const { stdout } = await execa('docker', ['logs', name]);
const targetFile = `${name}-${nodeId}.log`;
const targetPath = join(outputFolder, targetFile);

await Fsp.writeFile(targetPath, stdout);
logFiles.push(targetFile);

log.info(`Archived logs for ${name} to ${targetPath}`);
}

return logFiles;
}
1 change: 1 addition & 0 deletions packages/kbn-es/src/utils/index.ts
Original file line number Diff line number Diff line change
Expand Up @@ -20,3 +20,4 @@ export * from './parse_timeout_to_ms';
export * from './docker';
export * from './serverless_file_realm';
export * from './read_roles_from_resource';
export * from './extract_and_archive_logs';
Original file line number Diff line number Diff line change
Expand Up @@ -13,7 +13,7 @@ import type { ToolingLog } from '@kbn/tooling-log';
import getPort from 'get-port';
import { REPO_ROOT } from '@kbn/repo-info';
import type { ArtifactLicense, ServerlessProjectType } from '@kbn/es';
import { isServerlessProjectType } from '@kbn/es/src/utils';
import { isServerlessProjectType, extractAndArchiveLogs } from '@kbn/es/src/utils';
import type { Config } from '../../functional_test_runner';
import { createTestEsCluster, esTestConfig } from '../../es';

Expand Down Expand Up @@ -91,6 +91,7 @@ export async function runElasticsearch(
});
return async () => {
await node.cleanup();
await extractAndArchiveLogs({ outputFolder: logsDir, log });
};
}

Expand Down Expand Up @@ -119,6 +120,7 @@ export async function runElasticsearch(
return async () => {
await localNode.cleanup();
await remoteNode.cleanup();
await extractAndArchiveLogs({ outputFolder: logsDir, log });
};
}

Expand Down

0 comments on commit 3ad72b0

Please sign in to comment.