def md5(fname):
    """Return the hexadecimal MD5 digest of the file at ``fname``.

    The file is opened in binary mode and consumed in 4096-byte pieces, so
    the whole file is never held in memory at once.
    """
    digest = hashlib.md5()
    with open(fname, "rb") as stream:
        while True:
            block = stream.read(4096)
            # An empty bytes object signals end of file.
            if not block:
                break
            digest.update(block)
    return digest.hexdigest()