contrib-munin/plugins/apache/apache_users

171 lines
4.5 KiB
Bash
Executable File

#!/bin/bash
#
# apache_users - Munin plugin, displays traffic by user
#
# Version: 03.06.2009
# Author: Rainer Wolff <rainer.wolff@gmx.com>
#
# ################################################################################ MAGIC MARKERS
#%# family=contrib
#%# capabilities=autoconf
# ####################################################################################### CONFIG
DIRECTORY=${MUNIN_PLUGINSTATE:-/var/lib/munin/plugin-state/apache_users}
TIMESTAMP=$DIRECTORY/.apache_users
ACCESSLOG=/var/log/apache2/access_log
# ##################################################################################### AUTOCONF
if [ "$1" = "autoconf" ]
then
if ! ls $ACCESSLOG > /dev/null
then
echo "no (could not find apache access log \"$ACCESSLOG\")"
exit 1
elif ! ls $DIRECTORY > /dev/null
then
echo "no (could not find munin plugins directory \"$DIRECTORY\")"
exit 2
else
echo "yes"
exit 0
fi
fi
# ######################################################################################### INIT
# Define regex for all possible timestamps of last 5 minutes block
REGEX=$(LC_ALL=en_US date -d "5 minutes ago" "+\[%d\/%b\/%Y:%H: %M :[0-5][0-9] %z\]" \
| awk '{ printf "%s(%02d|%02d|%02d|%02d|%02d)%s", $1, $2-$2%5, $2-$2%5+1, $2-$2%5+2, $2-$2%5+3, $2-$2%5+4, $3 }')
# Analyse logfile
while read REQUEST_ADDR REQUEST_USERNAME REQUEST_BYTES
do
# Name resolution for known addresses
REQUEST_DOMAIN=$( awk '/^'"$REQUEST_ADDR"'/ { print $2 }' /etc/hosts )
REQUEST_ADDR=${REQUEST_DOMAIN:-$REQUEST_ADDR}
# Scan for known addresses, if found, sum up traffic
FOUND=false
for (( I=${#ADDR[@]}-1; I>=0; I-- ))
do
# Address known, name maybe, anonymous access (again)
if [ "${ADDR[I]}" == "$REQUEST_ADDR" -a "$REQUEST_USERNAME" == "-" ]
then
FOUND=true
BYTES[$I]=$(( ${BYTES[I]} + $REQUEST_BYTES ))
break
# Known address and name
elif [ "${ADDR[I]}" == "$REQUEST_ADDR" -a "${USERNAME[I]}" == "$REQUEST_USERNAME" ]
then
FOUND=true
BYTES[$I]=$(( ${BYTES[I]} + $REQUEST_BYTES ))
break
# Known address, previous access anonymous
elif [ "${ADDR[I]}" == "$REQUEST_ADDR" -a "${USERNAME[I]}" == "-" ]
then
FOUND=true
USERNAME[$I]="$REQUEST_USERNAME"
BYTES[$I]=$(( ${BYTES[I]} + $REQUEST_BYTES ))
break
fi
done
# Combination of address and name unknown, create new entry
if [ "$FOUND" == "false" ]
then
ADDR[${#ADDR[@]}]=$REQUEST_ADDR
USERNAME[${#USERNAME[@]}]="$REQUEST_USERNAME"
BYTES[${#BYTES[@]}]=$REQUEST_BYTES
fi
done < <( awk '/'"$REGEX"'/ { printf "%s %s %d\n", $1, $3, $10 }' $ACCESSLOG )
# Assign anonymous access when possible and correct identifiers
for (( I=0; I<${#USERNAME[@]}; I++ ))
do
if [ "${USERNAME[I]}" == "-" ]
then
if $( echo "${ADDR[I]}" | egrep -q "[^0-9.]" )
then
USERNAME[$I]="${ADDR[I]}"
else
USERNAME[$I]="anonymous"
fi
NAME[$I]="_${USERNAME[I]}" # Output sort order
else
NAME[$I]="${USERNAME[I]}"
fi
NAME[$I]="$( echo "${NAME[I]}" \
| sed "s/^[^A-Za-z_]/_/" | sed "s/[^A-Za-z0-9_]/_/g" \
| sed "s/^\(.\{,19\}\).*/\1/" )"
done
# Create timestamp
mkdir -p $DIRECTORY
touch -d "-1 second" $TIMESTAMP # find needs time span
# Aggregate parallel traffic
for (( I=0; I<${#NAME[@]}; I++ ))
do
if [ -z "$( find $DIRECTORY -name "${NAME[I]}" -newer $TIMESTAMP )" ]
then
echo "${NAME[I]} ${BYTES[I]} ${USERNAME[I]}" > $DIRECTORY/${NAME[I]}
else
awk '{ printf "%s %d %s", $1, $2+${BYTES[I]}, $3 }' $DIRECTORY/${NAME[I]} > $DIRECTORY/${NAME[I]}
fi
done
# ####################################################################################### CONFIG
if [ "$1" = "config" ]
then
echo "graph_title Apache users"
echo "graph_vlabel bytes per five minute period"
echo "graph_args --lower-limit 1 --base 1024 --logarithmic"
echo "graph_category webserver"
echo "graph_total total"
echo "graph_info Webserver traffic by user."
FILENAMES=$( find $DIRECTORY -type f -not -wholename $TIMESTAMP | sort)
awk '{ printf "%s.label %s\n%s.draw AREA\n", $1, $3, $1 }' $( echo "$FILENAMES" | head -n1 )
for FILENAME in $( echo "$FILENAMES" | tail -n+2)
do
awk '{ printf "%s.label %s\n%s.draw STACK\n", $1, $3, $1 }' $FILENAME
done
exit 0
fi
# ######################################################################################## VALUE
{
for FILENAME in $( find $DIRECTORY -type f -newer $TIMESTAMP -not -wholename $TIMESTAMP )
do
awk '{ printf "%s.value %d\n", $1, $2 }' $FILENAME
done
for FILENAME in $( find $DIRECTORY -type f -not -newer $TIMESTAMP -not -wholename $TIMESTAMP )
do
awk '{ printf "%s.value 0\n", $1 }' $FILENAME
done
} | sort
exit 0