2019-04-17 19:25:11 +02:00
|
|
|
#!/usr/bin/env python3
|
|
|
|
import os
|
2019-04-18 09:35:33 +02:00
|
|
|
import sys
|
2019-04-17 19:25:11 +02:00
|
|
|
import json
|
|
|
|
import socket
|
2019-04-18 09:35:33 +02:00
|
|
|
import logging
|
2019-04-17 19:25:11 +02:00
|
|
|
import requests
|
|
|
|
from datetime import datetime
|
|
|
|
from optparse import OptionParser
|
|
|
|
from elasticsearch import Elasticsearch
|
|
|
|
|
2019-04-18 09:35:33 +02:00
|
|
|
# Texts shown by the command-line parser in its --help output.
HELP_DESCRIPTION = 'This script collects latest log entries for provided messages from all nodes in a Nimbus fleet'
HELP_EXAMPLE = 'Example: collect -i logstash-2019.03.01 output.json'

# Log messages searched for unless others are given with -m/--messages.
DEFAULT_MESSAGES = ['Fork chosen', 'Attestation received', 'Slot start']

# Shortcut to the process environment.
ENV = os.environ

# Script-wide logger: records are written to STDERR as "[LEVEL]: message".
formatter = logging.Formatter('[%(levelname)s]: %(message)s')
handler = logging.StreamHandler(sys.stderr)
handler.setFormatter(formatter)
LOG = logging.getLogger('root')
LOG.addHandler(handler)
|
2019-04-17 19:25:11 +02:00
|
|
|
|
|
|
|
class ES:
    """Small wrapper around the Elasticsearch client used to fetch logs."""

    def __init__(self, host, port, page_size, timeout):
        """Create the client for the given host and port.

        page_size is sent as the ``size`` of every search issued through
        get_logs(); timeout is handed to the client unchanged.
        """
        self.page_size = page_size
        self.es = Elasticsearch([host], port=port, timeout=timeout)

    def make_query(self, fleet, program, messages, after):
        """Build the search body for the given fleet, program and messages.

        A hit must match ``fleet`` and ``program``, have an ``@timestamp``
        greater than ``after``, and contain at least one of ``messages`` as
        a phrase. Results are sorted by ``@timestamp``, newest first.
        """
        required = [
            {'match': {'fleet': fleet}},
            {'match': {'program': program}},
            {'range': {'@timestamp': {'gt': after}}},
        ]
        # One phrase clause per message; minimum_should_match below makes
        # at least one of them mandatory.
        wanted = []
        for text in messages:
            wanted.append({'match_phrase': {'message': text}})
        newest_first = [{'@timestamp': {'order': 'desc'}}]
        return {
            'query': {
                'bool': {
                    'must': required,
                    'should': wanted,
                    'minimum_should_match': 1,
                },
            },
            'sort': newest_first,
        }

    def _index(self):
        """Return the index argument for searches; currently always None."""
        # NOTE(review): presumably None makes the client search every
        # index - confirm against the client version in use.
        return None

    def get_logs(self, query):
        """Run ``query`` and return the raw search response."""
        search_kwargs = {
            'index': self._index(),
            'body': query,
            'size': self.page_size,
        }
        return self.es.search(**search_kwargs)
|
|
|
|
|
|
|
|
def get_first_for_node(logs):
    """Group search hits by node and program, keeping the first hit per message.

    ``logs`` is an iterable of search hits, each carrying a ``_source``
    dict with the keys ``logsource``, ``program``, ``message`` and ``raw``
    (a JSON string). The query built by ES.make_query() sorts hits newest
    first, so the first hit seen for a message is the latest one.

    Returns a nested dict ``{logsource: {program: {message: parsed_raw}}}``.
    Raises KeyError if a hit lacks one of the keys above, and ValueError
    (json.JSONDecodeError) if a retained ``raw`` value is not valid JSON.
    """
    prefix = 'docker/'
    data = {}
    for hit in logs:
        log = hit['_source']
        host_obj = data.setdefault(log['logsource'], {})
        # remove "docker/" prefix from program name (prefix only, not
        # occurrences elsewhere in the name)
        program = log['program']
        if program.startswith(prefix):
            program = program[len(prefix):]
        prog_obj = host_obj.setdefault(program, {})
        message = log['message']
        # Keep the first hit only: later hits for the same message are
        # older and must not overwrite it.
        if message not in prog_obj:
            prog_obj[message] = json.loads(log['raw'])
    return data
|
|
|
|
|
2019-04-19 12:50:55 +02:00
|
|
|
def save_stats(data, output_file):
    """Write the collected data, wrapped with metadata, as indented JSON.

    The emitted document has the shape ``{'meta': {...}, 'data': data}``
    where ``meta`` holds the local hostname and the current UTC time in
    ISO format.

    If ``output_file`` is truthy the JSON is written to that path
    (overwriting it); otherwise it is printed to STDOUT.
    """
    # add metadata for easier debugging
    output = {
        'meta': {
            'hostname': socket.gethostname(),
            'timestamp': datetime.utcnow().isoformat(),
        },
        'data': data,
    }

    if output_file:
        LOG.info('Saving to file: %s', output_file)
        with open(output_file, 'w', encoding='utf-8') as f:
            # Dump the wrapper, not the bare data, so the metadata built
            # above actually reaches the file.
            json.dump(output, f, indent=4)
    else:
        LOG.info('Printing results to STDOUT')
        print(json.dumps(output, indent=4))
|
|
|
|
|
2019-04-17 19:25:11 +02:00
|
|
|
def parse_opts(argv=None):
    """Parse the command line and return ``(options, positional_args)``.

    ``argv`` is the list of arguments to parse; when None (the default)
    the process arguments (``sys.argv[1:]``) are used.

    Numeric options (port, page size, timeout) are converted to int;
    a non-numeric value makes the parser exit with a usage error.
    """
    parser = OptionParser(description=HELP_DESCRIPTION, epilog=HELP_EXAMPLE)
    # NOTE(review): es_index is parsed here, but nothing visible in this
    # file reads it - main() never passes it on.
    parser.add_option('-i', '--index', dest='es_index',
                      default='logstash-'+datetime.today().strftime('%Y.%m.%d'),
                      help='Pattern for matching indices. (%default)')
    # The "append" action appends to the default object itself, so hand it
    # a copy; otherwise every -m would mutate DEFAULT_MESSAGES.
    parser.add_option('-m', '--messages', action='append',
                      default=list(DEFAULT_MESSAGES),
                      help='Messages to query for. (%default)')
    parser.add_option('-H', '--host', dest='es_host', default='localhost',
                      help='ElasticSearch host. (%default)')
    parser.add_option('-P', '--port', dest='es_port', type='int', default=9200,
                      help='ElasticSearch port. (%default)')
    parser.add_option('-p', '--program', default='*beacon-node-*',
                      help='Program to query for. (%default)')
    parser.add_option('-s', '--since', default='now-15m',
                      help='Period for which to query logs. (%default)')
    parser.add_option('-S', '--page-size', type='int', default=10000,
                      help='Size of results page. (%default)')
    parser.add_option('-f', '--fleet', default='nimbus.test',
                      help='Fleet to query for. (%default)')
    parser.add_option('-t', '--timeout', type='int', default=120,
                      help='Connection timeout in seconds. (%default)')
    parser.add_option('-l', '--log-level', default='INFO',
                      help='Logging level. (%default)')
    parser.add_option('-o', '--output-file',
                      help='File to which write the resulting JSON.')

    return parser.parse_args(argv)
|
|
|
|
|
2019-04-18 09:35:33 +02:00
|
|
|
def debug_options(opts):
    """Log every attribute of ``opts`` as a ``name=value`` line at DEBUG level."""
    LOG.debug('Settings:')
    for name, value in vars(opts).items():
        LOG.debug('%s=%s', name, value)
|
|
|
|
|
2019-04-17 19:25:11 +02:00
|
|
|
def main():
    """Query the fleet logs and save the first hit per node, program and message.

    Steps: parse the command line, configure the log level, run the
    search, group the hits with get_first_for_node() and hand the result
    to save_stats().

    The output path is taken from -o/--output-file; if that is absent the
    first positional argument is used, as in the help example. With
    neither, the result goes to STDOUT.
    """
    (opts, args) = parse_opts()

    # logging only knows upper-case level names; accept "-l debug" as well.
    LOG.setLevel(opts.log_level.upper())
    debug_options(opts)

    es = ES(opts.es_host, opts.es_port, opts.page_size, opts.timeout)

    LOG.info('Querying fleet: %s', opts.fleet)
    query = es.make_query(opts.fleet, opts.program, opts.messages, opts.since)
    rval = es.get_logs(query)

    LOG.info('Found matching logs: %d', rval['hits']['total']['value'])
    logs = rval['hits']['hits']

    data = get_first_for_node(logs)

    # Honour the positional form shown in the help example instead of
    # silently ignoring it; the explicit option takes precedence.
    output_file = opts.output_file
    if not output_file and args:
        output_file = args[0]

    save_stats(data, output_file)
|
2019-04-17 19:25:11 +02:00
|
|
|
|
|
|
|
# Run the collector only when executed as a script, not when imported.
if __name__ == "__main__":
    main()
|