您的位置:首页 > 运维架构 > Apache

解析Apache日志文件,正则表达式

2010-01-19 12:12 295 查看
解析Apache日志文件,正则表达式


/*

* Copyright (c) Ian F. Darwin, http://www.darwinsys.com/, 1996-2002.

* All rights reserved. Software written by Ian F. Darwin and others.

* $Id: LICENSE,v 1.8 2004/02/09 03:33:38 ian Exp $

*

* Redistribution and use in source and binary forms, with or without

* modification, are permitted provided that the following conditions

* are met:

* 1. Redistributions of source code must retain the above copyright

*    notice, this list of conditions and the following disclaimer.

* 2. Redistributions in binary form must reproduce the above copyright

*    notice, this list of conditions and the following disclaimer in the

*    documentation and/or other materials provided with the distribution.

*

* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS''

* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED

* TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR

* PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS

* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR

* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF

* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS

* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN

* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)

* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

* POSSIBILITY OF SUCH DAMAGE.

*

* Java, the Duke mascot, and all variants of Sun's Java "steaming coffee

* cup" logo are trademarks of Sun Microsystems. Sun's, and James Gosling's,

* pioneering role in inventing and promulgating (and standardizing) the Java

* language and environment is gratefully acknowledged.

*

* The pioneering role of Dennis Ritchie and Bjarne Stroustrup, of AT&T, for

* inventing predecessor languages C and C++ is also gratefully acknowledged.

*/

import 

java.util.regex.*;

/**

* Common fields for Apache Log demo.

*/

interface 

LogExample
{

/** The number of fields that must be found. */

public static final 

int 

NUM_FIELDS =
9
;

/** The sample log entry to be parsed. */

public static final 

String logEntryLine =
"123.45.67.89 - - [27/Oct/2000:09:27:09 -0400] /"GET /java/javaResources.html HTTP/1.0/" 200 10450 /"-/" /"Mozilla/4.6 [en] (X11; U; OpenBSD 2.8 i386; Nav)/""
;

}

/**

* Parse an Apache log file with Regular Expressions

*/

public class 

LogRegExp
implements 

LogExample
{

public static 

void 

main
(
String argv
[]) {

String logEntryPattern =
"^([//d.]+) (//S+) (//S+) //[([//w:/]+//s[+//-]//d{4})//] /"(.+?)/" (//d{3}) (//d+) /"([^/"]+)/" /"([^/"]+)/""
;

System.out.println
(
"Using RE Pattern:"
)
;

System.out.println
(
logEntryPattern
)
;

System.out.println
(
"Input line is:"
)
;

System.out.println
(
logEntryLine
)
;

Pattern p = Pattern.compile
(
logEntryPattern
)
;

Matcher matcher = p.matcher
(
logEntryLine
)
;

if 

(
!matcher.matches
()
||

NUM_FIELDS != matcher.groupCount
()) {

System.err.println
(
"Bad log entry (or problem with RE?):"
)
;

System.err.println
(
logEntryLine
)
;

return

;

}

System.out.println
(
"IP Address: "
+ matcher.group
(
1
))
;

System.out.println
(
"Date&Time: "
+ matcher.group
(
4
))
;

System.out.println
(
"Request: "
+ matcher.group
(
5
))
;

System.out.println
(
"Response: "
+ matcher.group
(
6
))
;

System.out.println
(
"Bytes Sent: "
+ matcher.group
(
7
))
;

if 

(
!matcher.group
(
8
)
.equals
(
"-"
))

System.out.println
(
"Referer: "
+ matcher.group
(
8
))
;

System.out.println
(
"Browser: "
+ matcher.group
(
9
))
;

}

}


内容来自用户分享和网络整理,不保证内容的准确性,如有侵权内容,可联系管理员处理 点击这里给我发消息
标签: