hotsanic |
Subversion Repositories: |
Compare with Previous - Blame - Download
#
# $Id: HotSaNIClogparse.pm,v 1.1 2004/02/08 20:42:05 bernisys Exp $
#
package HotSaNIClogparse;
($VERSION = '$Revision: 1.1 $') =~ s/.*(\d+\.\d+).*/$1/;
my %datehash=(Jan=>0,Feb=>1,Mar=>2,Apr=>3,May=>4,Jun=>5,Jul=>6,Aug=>7,Sep=>8,Oct=>9,Nov=>10,Dec=>11);
######################################################################
#
# finds logfiles that are not already parsed.
#
# USAGE: ($position,@files)=findlogs($dir,$names,$infofile);
#
# $dir the directory that contains the desired logfiles
#
# $names a regex that matches all desired logs
#
# $infofile is the path to a file where some information about
# the last parsing process has been stored.
#
#
# $position will be the position where the last parsing process stopped
#
# @files is an array containing all "newer" (i.e. unparsed) logs
# in hopefully the right order. This list can be parsed
# within a "foreach (@files) {...}" construct.
#
sub findlogs {
my $logdir = shift;
my $logfile = shift;
my $lastinfo = shift;
my @files;
use File::Find;
File::Find::find( {wanted => sub { /^$logfile\z/s && push @files,$File::Find::name; } }, $logdir);
my @sfiles = sort @files;
my $firstline="*** no lastfile found ***";
my $position=0;
if (-e $lastinfo) {
open FILE,$lastinfo;
$firstline=<FILE> || "*** empty lastfile ***";
$position=<FILE> || 0;
close FILE;
}
undef @files;
my $found=0;
while ($found==0) {
if (@sfiles) {
my $file=shift @sfiles;
open FILE,"$file";
my $line=<FILE>;
close FILE;
unshift @files,$file;
if ($line eq $firstline) { $found=1; }
}
else { $found=-1 }
}
if ($found < 0) { $position=0; }
return ($position,@files);
}
######################################################################
#
# parse a line of an apache logfile and return it splitted in a hash
#
sub parseline_apache {
my $line=shift || "";
my %info;
$line =~ /^([0-9]+\.[0-9]+\.[0-9]+\.[0-9]+) (.*?) (.*?) \[(.*?) (.*?)\] \"(\w+) (.*?) (.*?)\" ([0-9]+) ([0-9]+) \"(.*?)\" \"(.*?)\"$/, $info{IP}=$1,$info{REQuser}=$2,$info{REQauthuser}=$3,$info{TS}=$4,$info{TSzone}=$5,$info{REQtype}=$6,$info{REQwhat}=$7,$info{REQformat}=$8,$info{RETcode}=$9,$info{RETsize}=$10,$info{REQreferer}=$11,$info{REQagent}=$12;
$info{TS} =~ /([0-9]+)\/(\w+)\/([0-9]+)\:([0-9]+)\:([0-9]+)\:([0-9]+)/,$info{TSday}=$1*1,$info{TSmname}=$2,$info{TSyear}=$3,$info{TShour}=$4*1,$info{TSminute}=$5*1,$info{TSsecond}=$6*1;
$info{TSmonth}=$datehash{$info{TSmname}};
$info{TSzone} =~ /^(.)([0-9][0-9])/,$info{TSzdiff}=$1.$2*1;
$info{TStime} = time_to_seconds($info{TSyear},$info{TSmonth},$info{TSday},$info{TShour},$info{TSminute},$info{TSsecond});
return %info;
}
######################################################################
#
# converts year, month, mday, hour, minute and second
# into a timestamp such as time() produces.
#
# How? heh, heh. Binary search. :)
# Try setting/unsetting bits starting from the high end until
# localtime($result) matches the input time.
#
sub time_to_seconds {
my $a = sprintf "%04d%02d%02d%02d%02d%02d",@_;
my ($l_sec,$l_min,$l_hour,$l_mday,$l_mon,$l_year,$l_wday,$l_yday,$l_isdst);
my ($result, $bit, $i);
$result = 0;
# For each bit in the value, starting with the highest bit...
#
$bit=1024*1024*1024;
for (my $n=30;$n>=0; $n--) {
$bit=1<<$n;
$result += $bit; # Try setting it...
# Get the time info for that time...
($l_sec,$l_min,$l_hour,$l_mday,$l_mon,$l_year,$l_wday,$l_yday,$l_isdst) = localtime($result);
$l_year+=1900;
$l_mon+=1;
my $b = sprintf "%04d%02d%02d%02d%02d%02d",$l_year,$l_mon,$l_mday,$l_hour,$l_min,$l_sec;
$result -= $bit if ($a lt $b);
}
return($result);
}
1;