001 /** 002 * 003 * Licensed to the Apache Software Foundation (ASF) under one or more 004 * contributor license agreements. See the NOTICE file distributed with 005 * this work for additional information regarding copyright ownership. 006 * The ASF licenses this file to You under the Apache License, Version 2.0 007 * (the "License"); you may not use this file except in compliance with 008 * the License. You may obtain a copy of the License at 009 * 010 * http://www.apache.org/licenses/LICENSE-2.0 011 * 012 * Unless required by applicable law or agreed to in writing, software 013 * distributed under the License is distributed on an "AS IS" BASIS, 014 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 015 * See the License for the specific language governing permissions and 016 * limitations under the License. 017 */ 018 package org.apache.geronimo.jetty.requestlog; 019 020 import java.io.File; 021 import java.io.FilenameFilter; 022 import java.io.RandomAccessFile; 023 import java.nio.CharBuffer; 024 import java.nio.MappedByteBuffer; 025 import java.nio.channels.FileChannel; 026 import java.nio.charset.Charset; 027 import java.text.ParseException; 028 import java.text.SimpleDateFormat; 029 import java.util.ArrayList; 030 import java.util.Collection; 031 import java.util.Date; 032 import java.util.Iterator; 033 import java.util.LinkedList; 034 import java.util.List; 035 import java.util.regex.Matcher; 036 import java.util.regex.Pattern; 037 038 import org.apache.commons.logging.Log; 039 import org.apache.commons.logging.LogFactory; 040 import org.apache.geronimo.gbean.GBeanInfo; 041 import org.apache.geronimo.gbean.GBeanInfoBuilder; 042 import org.apache.geronimo.system.serverinfo.ServerInfo; 043 044 /** 045 * Jetty implementation of the WebAccessLog management interface. 046 * 047 * @version $Rev: 470597 $ $Date: 2006-11-02 15:30:55 -0800 (Thu, 02 Nov 2006) $ 048 */ 049 public class JettyLogManagerImpl implements JettyLogManager { 050 private final static Log log = LogFactory.getLog(JettyLogManagerImpl.class); 051 052 // Pattern that matches the date in the logfile name 053 private final static Pattern FILENAME_DATE_PATTERN = Pattern.compile("[-_ /.](((19|20)\\d\\d)[-_ /.](0[1-9]|1[012])[-_ /.](0[1-9]|[12][0-9]|3[01]))"); 054 private final static int GROUP_FILENAME_FULL_DATE = 1; 055 private final static int GROUP_FILENAME_YEAR = 2; 056 private final static int GROUP_FILENAME_MONTH = 4; 057 private final static int GROUP_FILENAME_DAY = 5; 058 // NOTE: The file separators are specified here rather than using something like File.separator because 059 // they are hard coded in config plans and sometimes in java code itself rather than being dependent 060 // upon the OS. This should be fixed someday, but for now we will manually check for either format. 061 private final static String FILE_SEPARATOR_UNIX_STYLE = "/"; 062 private final static String FILE_SEPARATOR_WIN_STYLE = "\\"; 063 064 // Pattern that matches a single line (used to calculate line numbers) 065 private final static Pattern FULL_LINE_PATTERN = Pattern.compile("^.*", Pattern.MULTILINE); 066 private final static Pattern ACCESS_LOG_PATTERN = Pattern.compile("(\\S*) (\\S*) (\\S*) \\[(.*)\\] \\\"(\\S*) (\\S*).*?\\\" (\\S*) (\\S*).*"); 067 private final static int GROUP_HOST = 1; 068 private final static int GROUP_USER = 3; 069 private final static int GROUP_DATE = 4; 070 private final static int GROUP_METHOD = 5; 071 private final static int GROUP_URI = 6; 072 private final static int GROUP_RESPONSE_CODE = 7; 073 private final static int GROUP_RESPONSE_LENGTH = 8; 074 private final static String ACCESS_LOG_DATE_FORMAT = "dd/MMM/yyyy:HH:mm:ss ZZZZ"; 075 private final static String LOG_FILE_NAME_FORMAT = "yyyy_MM_dd"; 076 private final Collection logGbeans; 077 private final ServerInfo serverInfo; 078 079 public JettyLogManagerImpl(ServerInfo serverInfo, Collection logGbeans) { 080 this.serverInfo = serverInfo; 081 this.logGbeans = logGbeans; 082 } 083 084 /** 085 * Gets the name of all logs used by this system. Typically there 086 * is only one, but specialized cases may use more. 087 * 088 * @return An array of all log names 089 * 090 */ 091 public String[] getLogNames() { 092 List logNames = new ArrayList(); 093 for (Iterator it = logGbeans.iterator(); it.hasNext();) { 094 JettyRequestLog jettyLog = (JettyRequestLog) it.next(); 095 if(jettyLog.getFilename() != null) { 096 logNames.add(jettyLog.getFilename()); 097 } 098 } 099 return (String[]) logNames.toArray(new String[logNames.size()]); 100 } 101 102 /** 103 * Gets the names of all log files for this log name. 104 * 105 * @param logName The name of the log for which to return the specific file names. 106 * 107 * @return An array of log file names 108 * 109 */ 110 public String[] getLogFileNames(String logName) { 111 List names = new ArrayList(); 112 113 // Find all the files for this logName 114 File[] logFiles = getLogFiles(logName); 115 116 if (logFiles !=null) { 117 for (int i = 0; i < logFiles.length; i++) { 118 names.add(logFiles[i].getName()); 119 } 120 } 121 return (String[]) names.toArray(new String[names.size()]); 122 } 123 124 /** 125 * Gets the name of all log files used by this log. Typically there 126 * is only one, but specialized cases may use more. 127 * 128 * @param logName The name of the log for which to return the specific files. 129 * 130 * @return An array of all log file names 131 * 132 */ 133 private File[] getLogFiles(String logName) { 134 File[] logFiles = null; 135 136 try { 137 String fileNamePattern = logName; 138 if (fileNamePattern.indexOf(FILE_SEPARATOR_UNIX_STYLE) > -1) { 139 fileNamePattern = fileNamePattern.substring(fileNamePattern.lastIndexOf(FILE_SEPARATOR_UNIX_STYLE) + 1); 140 } else if (fileNamePattern.indexOf(FILE_SEPARATOR_WIN_STYLE) > -1) { 141 fileNamePattern = fileNamePattern.substring(fileNamePattern.lastIndexOf(FILE_SEPARATOR_WIN_STYLE) + 1); 142 } 143 144 String logFile = serverInfo.resolvePath(logName); 145 146 File parent = new File(logFile).getParentFile(); 147 148 if (parent != null) { 149 logFiles = parent.listFiles(new PatternFilenameFilter(fileNamePattern)); 150 } 151 } catch (Exception e) { 152 log.error("Exception attempting to locate Jetty log files", e); 153 logFiles = new File[0]; 154 } 155 return logFiles; 156 } 157 158 /** 159 * Searches the log for records matching the specified parameters. The 160 * maximum results returned will be the lesser of 1000 and the 161 * provided maxResults argument. 162 * 163 * @see #MAX_SEARCH_RESULTS 164 */ 165 public SearchResults getMatchingItems(String logName, String host, String user, String method, String uri, Date startDate, 166 Date endDate, Integer skipResults, Integer maxResults) { 167 168 // Clean up the arguments so we know what we've really got 169 if(host != null && host.equals("")) host = null; 170 if(user != null && user.equals("")) user = null; 171 if(method != null && method.equals("")) method = null; 172 if(uri != null && uri.equals("")) uri = null; 173 174 long start = startDate == null ? 0 : startDate.getTime(); 175 long end = endDate == null ? 0 : endDate.getTime(); 176 177 List list = new LinkedList(); 178 boolean capped = false; 179 int lineCount = 0, fileCount = 0; 180 181 // Find all the files for this logName 182 File logFiles[] = getLogFiles(logName); 183 184 if (logFiles !=null) { 185 for (int i = 0; i < logFiles.length; i++) { 186 fileCount = 0; 187 try { 188 // Obtain the date for the current log file 189 String fileName = logFiles[i].getName(); 190 Matcher fileDate = FILENAME_DATE_PATTERN.matcher(fileName); 191 fileDate.find(); 192 SimpleDateFormat simpleFileDate = new SimpleDateFormat(LOG_FILE_NAME_FORMAT); 193 long logFileTime = simpleFileDate.parse(fileDate.group(GROUP_FILENAME_FULL_DATE)).getTime(); 194 195 // Check if the dates are null (ignore) or fall within the search range 196 if ( (start==0 && end==0) 197 || (start>0 && start<=logFileTime && end>0 && end>=logFileTime)) { 198 199 // It's in the range, so process the file 200 RandomAccessFile raf = new RandomAccessFile(logFiles[i], "r"); 201 FileChannel fc = raf.getChannel(); 202 MappedByteBuffer bb = fc.map(FileChannel.MapMode.READ_ONLY, 0, fc.size()); 203 CharBuffer cb = Charset.forName("US-ASCII").decode(bb); //todo: does Jetty use a different charset on a foreign PC? 204 Matcher lines = FULL_LINE_PATTERN.matcher(cb); 205 Matcher target = ACCESS_LOG_PATTERN.matcher(""); 206 SimpleDateFormat format = (start == 0 && end == 0) ? null : new SimpleDateFormat(ACCESS_LOG_DATE_FORMAT); 207 int max = maxResults == null ? MAX_SEARCH_RESULTS : Math.min(maxResults.intValue(), MAX_SEARCH_RESULTS); 208 209 while(lines.find()) { 210 ++lineCount; 211 ++fileCount; 212 if(capped) { 213 continue; 214 } 215 CharSequence line = cb.subSequence(lines.start(), lines.end()); 216 target.reset(line); 217 if(target.find()) { 218 if(host != null && !host.equals(target.group(GROUP_HOST))) { 219 continue; 220 } 221 if(user != null && !user.equals(target.group(GROUP_USER))) { 222 continue; 223 } 224 if(method != null && !method.equals(target.group(GROUP_METHOD))) { 225 continue; 226 } 227 if(uri != null && !target.group(GROUP_URI).startsWith(uri)) { 228 continue; 229 } 230 if(format != null) { 231 try { 232 long entry = format.parse(target.group(GROUP_DATE)).getTime(); 233 if(start > entry) { 234 continue; 235 } 236 if(end > 0 && end < entry) { 237 continue; 238 } 239 } catch (ParseException e) { 240 // can't read the date, guess this record counts. 241 } 242 } 243 if(skipResults != null && skipResults.intValue() > lineCount) { 244 continue; 245 } 246 if(list.size() > max) { 247 capped = true; 248 continue; 249 } 250 list.add(new LogMessage(fileCount,line.toString())); 251 } 252 } 253 fc.close(); 254 raf.close(); 255 } 256 } catch (Exception e) { 257 log.error("Unexpected error processing logs", e); 258 } 259 } 260 } 261 return new SearchResults(lineCount, (LogMessage[]) list.toArray(new LogMessage[list.size()]), capped); 262 } 263 264 265 public static final GBeanInfo GBEAN_INFO; 266 267 static { 268 GBeanInfoBuilder infoFactory = GBeanInfoBuilder.createStatic("Jetty Log Manager", JettyLogManagerImpl.class); 269 infoFactory.addReference("LogGBeans", JettyRequestLog.class); 270 infoFactory.addReference("ServerInfo", ServerInfo.class, "GBean"); 271 infoFactory.addInterface(JettyLogManager.class); 272 273 infoFactory.setConstructor(new String[]{"ServerInfo","LogGBeans"}); 274 GBEAN_INFO = infoFactory.getBeanInfo(); 275 } 276 277 public static GBeanInfo getGBeanInfo() { 278 return GBEAN_INFO; 279 } 280 281 /* 282 * Static inner class implementation of java.io.Filename. This will help us 283 * filter for only the files that we are interested in. 284 */ 285 static class PatternFilenameFilter implements FilenameFilter { 286 Pattern pattern; 287 //todo: put this pattern in a GBean parameter? 288 PatternFilenameFilter(String fileNamePattern) { 289 fileNamePattern = fileNamePattern.replaceAll("yyyy", "\\\\d{4}"); 290 fileNamePattern = fileNamePattern.replaceAll("yy", "\\\\d{2}"); 291 fileNamePattern = fileNamePattern.replaceAll("mm", "\\\\d{2}"); 292 fileNamePattern = fileNamePattern.replaceAll("dd", "\\\\d{2}"); 293 this.pattern = Pattern.compile(fileNamePattern); 294 } 295 296 public boolean accept(File file, String fileName) { 297 return pattern.matcher(fileName).matches(); 298 } 299 } 300 }