Log aggregation in AWS - part 2 - keeping your index under control - ASP.Net & Sitecore Blog

This is the second part of the series, following on from /log-aggregation-aws-part-1/

Hopefully by this point you’ve got Kibana up and running, gathering all the logs from each of your desired CloudWatch groups. Over time the amount of data stored in the index will keep growing, so we need to keep things under control.

Here is a good view of the issue. We introduced our cleanup lambda on the 30th; if we hadn’t, I reckon we’d have had about 2 more days of uptime before the disks ran out. The oscillating pattern from the 31st onward is exactly what we’d want to see – every day we delete the indices that are older than 10 days.

Initially this was done via a scheduled task from a box we host – it worked but wasn’t ideal as it relies on the box running, potentially user creds and lots more. What seemed a better fit was to use AWS Lambda to keep our index under control.

Getting setup

Luckily you don’t need to set up much for this. One AWS Lambda, a trigger and some role permissions and you should be up and running.

Create a new lambda function based off the script shown below
Add 2 environment variables:
1. daysToKeep=10
2. endpoint=elastic search endpoint e.g. search-###-###.eu-west-1.es.amazonaws.com

Create a new role as part of the setup process

Note, these can then be found in the IAM section of AWS e.g. https://console.aws.amazon.com/iam/home?region=eu-west-1#/roles
Update the role to allow Get and Delete access to your index with the policy:

{
    "Version": "2012-10-17",
    "Statement": [
        {
            "Effect": "Allow",
            "Action": [
                "es:ESHttpGet",
                "es:ESHttpDelete"
            ],
            "Resource": "ARN of elastic search index"
        }
    ]
}

{

"Version": "2012-10-17",

"Statement": [

{

"Effect": "Allow",

"Action": [

"es:ESHttpGet",

"es:ESHttpDelete"

],

"Resource": "ARN of elastic search index"

}

]

}

Setup a trigger (in CloudWatch -> Events -> Rules)
1. Here you can set the frequency of how often to run e.g. a CRON of
  
  0 2 * * ? *
  
  will run at 2am (UTC) every night
Test your function, you can always run on demand and then check whether the indices have been removed

And finally the lambda code:

var AWS = require('aws-sdk');

// Elasticsearch endpoint; assigned by the handler on every invocation and read by makeRequest.
var endpoint; 
// Credentials passed to the V4 signer in makeRequest.
// NOTE(review): presumably resolves the Lambda role's AWS_* environment variables — confirm against the SDK docs.
var creds = new AWS.EnvironmentCredentials('AWS');

/**
 * Returns a copy of this date shifted by a number of calendar days.
 * The receiver itself is left untouched.
 *
 * @param {number} days - Days to add; pass a negative value to go back in time.
 * @returns {Date} A new Date instance offset by `days`.
 */
Date.prototype.addDays = function(days) {
	const shifted = new Date(this.getTime());
	const targetDayOfMonth = shifted.getDate() + days;

	// setDate() rolls over month/year boundaries when the value is out of range
	shifted.setDate(targetDayOfMonth);

	return shifted;
};

exports.handler = function(input, context)
{
	endpoint = new AWS.Endpoint(process.env.endpoint);

	let dateBaseline = new Date();

	dateBaseline = dateBaseline.addDays(-parseInt(process.env.daysToKeep));

	console.log("Date baseline: " + dateBaseline.toISOString());

	getIndices(context, function(data)
	{
		data.split('\n').forEach((row) =>
			{
				let parts = row.split(" ");
				
				if (parts.length > 2)
				{
					let indiceName = parts[2];

					if (indiceName.indexOf("cwl") > -1)
					{
						let indiceDate = new Date(indiceName.substr(4, 4), indiceName.substr(9, 2)-1, indiceName.substr(12, 2));
						
						if (indiceDate < dateBaseline)
						{
							console.log("Planning to delete indice: " + indiceName);

							removeIndice("/"+indiceName, context);
						}
					}
				}
			});
	});
}

/**
 * Issues a DELETE request for a single index.
 *
 * @param {string} indiceName - Request path of the index, e.g. "/cwl-2017.09.30".
 * @param {object} context    - Lambda context, forwarded to makeRequest.
 */
function removeIndice(indiceName, context)
{
	const httpMethod = "DELETE";

	makeRequest(httpMethod, indiceName, context);
}

/**
 * Requests the list of indices and passes the raw response body to `callback`.
 *
 * @param {object}   context  - Lambda context, forwarded to makeRequest.
 * @param {function} callback - Receives the response body as a string.
 */
function getIndices(context, callback)
{
	const catIndicesPath = '/_cat/indices';

	makeRequest("GET", catIndicesPath, context, callback);
}

/**
 * Sends a V4-signed HTTP request to the Elasticsearch endpoint and hands the
 * complete response body to `callback`.
 *
 * The Lambda is failed (context.fail) when the request cannot be sent or when
 * the response carries an HTTP status of 400 or above; `callback` is not
 * invoked in either case.
 *
 * @param {string}   method     - HTTP verb, e.g. "GET" or "DELETE".
 * @param {string}   path       - Request path, e.g. "/_cat/indices".
 * @param {object}   context    - Lambda context used to report failures.
 * @param {function} [callback] - Optional; receives the response body as a string.
 */
function makeRequest(method, path, context, callback)
{
	console.log(`Making ${method} call to ${path}`);

	const req = new AWS.HttpRequest(endpoint);

	req.method = method;
	req.path = path;
	// Region used when signing; the optional "region" environment variable
	// overrides the original eu-west-1 default.
	req.region = process.env.region || "eu-west-1";
	req.headers['presigned-expires'] = false;
	req.headers['Host'] = endpoint.host;

	const signer = new AWS.Signers.V4(req, 'es');
	signer.addAuthorization(creds, new Date());

	const send = new AWS.NodeHttpClient();
	send.handleRequest(req,
		null,
		function(httpResp)
		{
			let respBody = '';
			httpResp.on('data',
				function(chunk)
				{
					respBody += chunk;
				});
			httpResp.on('end',
				function()
				{
					// A rejected request (bad signature, missing permission, server
					// error) must not be mistaken for a successful one.
					if (httpResp.statusCode >= 400)
					{
						console.log(`Error: ${method} ${path} returned HTTP ${httpResp.statusCode}: ${respBody}`);
						context.fail(`Lambda failed with error HTTP ${httpResp.statusCode} on ${method} ${path}`);
						return;
					}

					if (callback)
					{
						callback(respBody);
					}
				});
		},
		function(err)
		{
			console.log('Error: ' + err);
			context.fail('Lambda failed with error ' + err);
		});
}

var AWS = require('aws-sdk');

// Elasticsearch endpoint; assigned by the handler on every invocation and read by makeRequest.
var endpoint;

// Credentials passed to the V4 signer in makeRequest.
// NOTE(review): presumably resolves the Lambda role's AWS_* environment variables — confirm against the SDK docs.
var creds = new AWS.EnvironmentCredentials('AWS');

/**
 * Returns a copy of this date shifted by a number of calendar days.
 * The receiver itself is left untouched.
 *
 * @param {number} days - Days to add; pass a negative value to go back in time.
 * @returns {Date} A new Date instance offset by `days`.
 */
Date.prototype.addDays = function(days) {
	const shifted = new Date(this.getTime());
	const targetDayOfMonth = shifted.getDate() + days;

	// setDate() rolls over month/year boundaries when the value is out of range
	shifted.setDate(targetDayOfMonth);

	return shifted;
};

exports.handler = function(input, context)

{

endpoint = new AWS.Endpoint(process.env.endpoint);

let dateBaseline = new Date();

dateBaseline = dateBaseline.addDays(-parseInt(process.env.daysToKeep));

console.log("Date baseline: " + dateBaseline.toISOString());

getIndices(context, function(data)

{

data.split('\n').forEach((row) =>

{

let parts = row.split(" ");

if (parts.length > 2)

{

let indiceName = parts[2];

if (indiceName.indexOf("cwl") > -1)

{

let indiceDate = new Date(indiceName.substr(4, 4), indiceName.substr(9, 2)-1, indiceName.substr(12, 2));

if (indiceDate < dateBaseline)

{

console.log("Planning to delete indice: " + indiceName);

removeIndice("/"+indiceName, context);

}

});

}

/**
 * Issues a DELETE request for a single index.
 *
 * @param {string} indiceName - Request path of the index, e.g. "/cwl-2017.09.30".
 * @param {object} context    - Lambda context, forwarded to makeRequest.
 */
function removeIndice(indiceName, context)
{
	const httpMethod = "DELETE";

	makeRequest(httpMethod, indiceName, context);
}

/**
 * Requests the list of indices and passes the raw response body to `callback`.
 *
 * @param {object}   context  - Lambda context, forwarded to makeRequest.
 * @param {function} callback - Receives the response body as a string.
 */
function getIndices(context, callback)
{
	const catIndicesPath = '/_cat/indices';

	makeRequest("GET", catIndicesPath, context, callback);
}

/**
 * Sends a V4-signed HTTP request to the Elasticsearch endpoint and hands the
 * complete response body to `callback`.
 *
 * The Lambda is failed (context.fail) when the request cannot be sent or when
 * the response carries an HTTP status of 400 or above; `callback` is not
 * invoked in either case.
 *
 * @param {string}   method     - HTTP verb, e.g. "GET" or "DELETE".
 * @param {string}   path       - Request path, e.g. "/_cat/indices".
 * @param {object}   context    - Lambda context used to report failures.
 * @param {function} [callback] - Optional; receives the response body as a string.
 */
function makeRequest(method, path, context, callback)
{
	console.log(`Making ${method} call to ${path}`);

	const req = new AWS.HttpRequest(endpoint);

	req.method = method;
	req.path = path;
	// Region used when signing; the optional "region" environment variable
	// overrides the original eu-west-1 default.
	req.region = process.env.region || "eu-west-1";
	req.headers['presigned-expires'] = false;
	req.headers['Host'] = endpoint.host;

	const signer = new AWS.Signers.V4(req, 'es');
	signer.addAuthorization(creds, new Date());

	const send = new AWS.NodeHttpClient();
	send.handleRequest(req,
		null,
		function(httpResp)
		{
			let respBody = '';
			httpResp.on('data',
				function(chunk)
				{
					respBody += chunk;
				});
			httpResp.on('end',
				function()
				{
					// A rejected request (bad signature, missing permission, server
					// error) must not be mistaken for a successful one.
					if (httpResp.statusCode >= 400)
					{
						console.log(`Error: ${method} ${path} returned HTTP ${httpResp.statusCode}: ${respBody}`);
						context.fail(`Lambda failed with error HTTP ${httpResp.statusCode} on ${method} ${path}`);
						return;
					}

					if (callback)
					{
						callback(respBody);
					}
				});
		},
		function(err)
		{
			console.log('Error: ' + err);
			context.fail('Lambda failed with error ' + err);
		});
}

Note, if you are running in a different region you will need to tweak req.region = "eu-west-1";

How does it work?

Elasticsearch allows you to list all indices via the URL /_cat/indices. The lambda function makes a web request to this URL, parses each row and finds any indices whose name matches cwl-YYYY.MM.dd. If an index is found that is older than the number of days to keep, a delete request is issued to Elasticsearch.

Was this the best option?

There are tools available for cleaning up old indices, even ones that Elastic themselves provide (https://github.com/elastic/curator); however, this requires additional boxes to run, hence the choice of keeping it wrapped in a simple lambda.

Happy indexing!

4 thoughts on “Log aggregation in AWS – part 2 – keeping your index under control”

Martin Gladdish says:

October 1, 2017 at 8:56 am

Thanks, this was extremely useful. Simple and to the point.

harish says:

November 8, 2017 at 7:27 pm

Hi,

Nice article.

I am newbie. When you create Lambda function what type of Runtime do we have to select (c#, java 8, node.js 4.3, jode.js 6.10, python 2.7, python 3.6)

Do we have to specify VPC and Subnet for this when we creating the function.

Finally, how do test this please manually. Detail steps would be very helpful.

Many thanks

- boro says:
  
  November 14, 2017 at 4:14 pm
  
  These functions are done in javascript so would be node. We run as 4.3.
  You can leave the VPC (and subnet) blank, unless you need to run within a secure network you own.
  
- boro says:
  
  November 14, 2017 at 4:15 pm
  
  To test the function you can run from within the AWS console, rather than waiting for the timed trigger to kick in.

blog.boro2g .co.uk

Some ideas about coding, dev and all things online.

Log aggregation in AWS – part 2 – keeping your index under control

4 thoughts on “Log aggregation in AWS – part 2 – keeping your index under control”

Leave a Reply Cancel reply