jablonka.czprosek.czf

hotsanic

Subversion Repositories:
[/] [trunk/] [lib/] [HotSaNIClogparse.pm] - Rev 20 Go to most recent revision

Compare with Previous - Blame - Download


#
# $Id: HotSaNIClogparse.pm,v 1.1 2004/02/08 20:42:05 bernisys Exp $
#

package HotSaNIClogparse;

# Module version, extracted from the CVS "Revision" keyword in the literal.
# The leading match is non-greedy so that a multi-digit major number
# (e.g. "10.2") is kept intact instead of being cut down to "0.2".
($VERSION = '$Revision: 1.1 $') =~ s/.*?(\d+\.\d+).*/$1/;

# Maps the English three-letter month abbreviations to ZERO-based month
# numbers (Jan => 0 ... Dec => 11).
my %datehash=(Jan=>0,Feb=>1,Mar=>2,Apr=>3,May=>4,Jun=>5,Jul=>6,Aug=>7,Sep=>8,Oct=>9,Nov=>10,Dec=>11);

######################################################################
#
# finds logfiles that are not already parsed.
#
# USAGE: ($position,@files)=findlogs($dir,$names,$infofile);
#
#  $dir       the directory that contains the desired logfiles
#
#  $names     a regex that matches all desired logs
#
#  $infofile  is the path to a file where some information about
#             the last parsing process has been stored.
#
#
#  $position  will be the position where the last parsing process stopped
#
#  @files     is an array containing all "newer" (i.e. unparsed) logs,
#             in reverse lexical order of their path names, beginning
#             with the log that was parsed last time if it still exists.
#             This list can be parsed within a "foreach (@files) {...}"
#             construct.
#
sub findlogs {
  my $logdir = shift;
  my $logfile = shift;
  my $lastinfo = shift;

  # Collect every file below $logdir whose base name matches $logfile.
  # $logfile is interpolated as a regular expression on purpose; note that
  # the anchors bind only to the outermost alternatives if it contains "|".
  my @candidates;
  use File::Find;
  File::Find::find( {wanted => sub { /^$logfile\z/s && push @candidates,$File::Find::name; } }, $logdir);

  # The info file holds two lines: the first line of the log that was
  # parsed last, and the position at which parsing stopped.
  # An unreadable info file is treated like an empty one (best effort).
  my $firstline="*** no lastfile found ***";
  my $position=0;
  if (-e $lastinfo) {
    $firstline="*** empty lastfile ***";
    if (open my $info, '<', $lastinfo) {
      my $stored=<$info>;
      $firstline=$stored if $stored;
      # Returned exactly as read (including any line ending).
      $position=<$info> || 0;
      close $info;
      }
    }

  # Walk the logs in sorted order and prepend each one to the result, so
  # the result ends up in reverse sorted order. Stop at the log whose
  # first line equals the remembered one: that is where parsing resumes.
  my @files;
  my $found=0;
  for my $file (sort @candidates) {
    my $line;
    # Three-argument open: the name is taken literally, so whitespace or
    # characters such as ">" and "|" in a file name cannot change what is
    # opened. Unreadable logs simply never match.
    if (open my $log, '<', $file) {
      $line=<$log>;
      close $log;
      }
    unshift @files,$file;
    if (defined $line && $line eq $firstline) {
      $found=1;
      last;
      }
    }

  # Without a matching log the stored position refers to a file that is
  # gone, so parsing has to start from the beginning.
  $position=0 unless $found;

  return ($position,@files);
  }



######################################################################
#
# parse a line of an apache logfile and return it split into a hash
#
sub parseline_apache {
  # Parses one line in Apache "combined" log format.
  #
  # Returns a hash with the keys IP, REQuser, REQauthuser, TS, TSzone,
  # REQtype, REQwhat, REQformat, RETcode, RETsize, REQreferer, REQagent,
  # TSday, TSmname, TSyear, TShour, TSminute, TSsecond, TSmonth (0-11),
  # TSzdiff (signed hour offset) and TStime (seconds since the epoch).
  # Returns an empty hash if the line cannot be parsed.
  my $line=shift || "";
  my %info;

  # Only dotted-quad (IPv4) client addresses are recognised. The size field
  # may be "-", which Apache writes when no bytes were sent.
  my @fields = $line =~ /^([0-9]+\.[0-9]+\.[0-9]+\.[0-9]+) (.*?) (.*?) \[(.*?) (.*?)\] \"(\w+) (.*?) (.*?)\" ([0-9]+) ([0-9]+|-) \"(.*?)\" \"(.*?)\"$/;
  return %info unless @fields;

  # Timestamp looks like "08/Feb/2004:20:42:05".
  my ($day,$mname,$year,$hour,$minute,$second) =
    $fields[3] =~ /([0-9]+)\/(\w+)\/([0-9]+)\:([0-9]+)\:([0-9]+)\:([0-9]+)/;
  return %info unless defined $second && exists $datehash{$mname};

  # Nothing is stored before both matches have succeeded, so a malformed
  # line can never yield captures left over from an earlier match.
  @info{qw(IP REQuser REQauthuser TS TSzone REQtype REQwhat REQformat RETcode RETsize REQreferer REQagent)} = @fields;
  $info{RETsize}=0 if $info{RETsize} eq '-';

  $info{TSday}=$day*1;
  $info{TSmname}=$mname;
  $info{TSyear}=$year;
  $info{TShour}=$hour*1;
  $info{TSminute}=$minute*1;
  $info{TSsecond}=$second*1;
  $info{TSmonth}=$datehash{$mname};

  # Sign followed by the numeric hour part of the zone, e.g. "+0100" -> "+1".
  $info{TSzdiff} = ($info{TSzone} =~ /^(.)([0-9][0-9])/) ? $1.$2*1 : 0;

  # time_to_seconds() compares against a one-based month, whereas TSmonth
  # is zero-based, hence the +1.
  $info{TStime} = time_to_seconds($info{TSyear},$info{TSmonth}+1,$info{TSday},$info{TShour},$info{TSminute},$info{TSsecond});

  return %info;
  }


######################################################################
# 
# converts year, month (1-12), mday, hour, minute and second
# (given in local time) into a timestamp such as time() produces.
#
# How?  heh, heh.  Binary search. :)
# Try setting/unsetting bits starting from the high end until 
# localtime($result) matches the input time.
#
sub time_to_seconds {
  # Arguments: year (4 digits), month (1-12), mday, hour, minute, second.
  # The wanted time is rendered as a fixed-width string so that a plain
  # string comparison orders two times chronologically.
  my $wanted = sprintf "%04d%02d%02d%02d%02d%02d",@_;
  my $seconds = 0;

  # Build the result bit by bit, from bit 30 down to bit 0: a bit is kept
  # unless setting it moves localtime() past the wanted time.
  for my $shift (reverse 0 .. 30) {
    my $candidate = $seconds + (1 << $shift);

    my ($sec,$min,$hour,$mday,$mon,$year) = localtime($candidate);

    # localtime() counts years from 1900 and months from 0.
    my $stamp = sprintf "%04d%02d%02d%02d%02d%02d",$year+1900,$mon+1,$mday,$hour,$min,$sec;

    $seconds = $candidate unless $wanted lt $stamp;
    }

  return($seconds);
  }

1;


Powered by WebSVN 2.2.1