2 /**************************************************************************
3 ** (c) Copyright 2002, Andromeda Technology & Automation
4 ** This is free software; you can redistribute it and/or modify it under the
5 ** terms of the GNU General Public License, see the file COPYING.
6 ***************************************************************************
7 ** MODULE INFORMATION *
8 ***********************
9 ** FILE NAME : access_cooker.cpp
11 ** VERSION NUMBER : $Revision: 1.2 $
13 ** DESCRIPTION : Cooks Apache http daemon access log lines
18 ***************************************************************************
19 ** ADMINISTRATIVE INFORMATION *
20 ********************************
21 ** ORIGINAL AUTHOR : Arjen Baart - arjen@andromeda.nl
22 ** CREATION DATE : Aug 11, 2003
23 ** LAST UPDATE : Aug 11, 2003
25 **************************************************************************/
27 /*****************************
28 $Log: access_cooker.cpp,v $
29 Revision 1.2 2003-12-04 10:38:09 arjen
30 Major redesign. All input is handled through XML. Raw input data is first
31 transformed into an XML document for further processing.
32 A collection of polymorphic classes handle the transformation of various
33 input formats into XML.
34 Classifying input data is done with a finite improbability calculation.
36 Revision 1.1 2003/08/11 16:56:15 arjen
37 Different kinds of log files are parsed by a collection of objects
38 of different classes, derived from the base class line_cooker
39 Depending on the message content or the message_type element in
40 XML, one of these objects is selected.
42 Logrunner is integrated with gcm_input. Although its functionality
43 is still limited, a connection between logrunner and gcm_input
46 *****************************/
48 /* static const char *RCSID = "$Id: access_cooker.cpp,v 1.2 2003-12-04 10:38:09 arjen Exp $"; */
52 #include "access_cooker.h"
54 static const regex re_accesslog("(GET|POST|HEAD) .+ HTTP");
56 bool access_cooker::check_pattern(String logline)
58 return logline == re_accesslog;
61 bool access_cooker::cook_this(String logline, UTC arrival)
63 if (check_pattern(logline))
65 String datestring = logline(regex("\\[.+\\]"));
69 datestring[datestring.index(':')] = ' ';
71 date log_date = datestring;
72 hour log_time = datestring;
74 log_date = datestring;
75 log_time = datestring;
77 ts = UTC(log_date, log_time);