001 /* $Id: SimpleRegexMatcher.java 992060 2010-09-02 19:09:47Z simonetripodi $ 002 * 003 * Licensed to the Apache Software Foundation (ASF) under one or more 004 * contributor license agreements. See the NOTICE file distributed with 005 * this work for additional information regarding copyright ownership. 006 * The ASF licenses this file to You under the Apache License, Version 2.0 007 * (the "License"); you may not use this file except in compliance with 008 * the License. You may obtain a copy of the License at 009 * 010 * http://www.apache.org/licenses/LICENSE-2.0 011 * 012 * Unless required by applicable law or agreed to in writing, software 013 * distributed under the License is distributed on an "AS IS" BASIS, 014 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 015 * See the License for the specific language governing permissions and 016 * limitations under the License. 017 */ 018 019 package org.apache.commons.digester; 020 021 import org.apache.commons.logging.Log; 022 import org.apache.commons.logging.LogFactory; 023 024 /** 025 * <p>Simple regex pattern matching algorithm.</p> 026 * 027 * <p>This uses just two wildcards: 028 * <ul> 029 * <li><code>*</code> matches any sequence of none, one or more characters 030 * <li><code>?</code> matches any one character 031 * </ul> 032 * Escaping these wildcards is not supported .</p> 033 * 034 * @since 1.5 035 */ 036 037 public class SimpleRegexMatcher extends RegexMatcher { 038 039 // --------------------------------------------------------- Fields 040 041 /** Default log (class wide) */ 042 private static final Log baseLog = LogFactory.getLog(SimpleRegexMatcher.class); 043 044 /** Custom log (can be set per object) */ 045 private Log log = baseLog; 046 047 // --------------------------------------------------------- Properties 048 049 /** 050 * Gets the <code>Log</code> implementation. 051 */ 052 public Log getLog() { 053 return log; 054 } 055 056 /** 057 * Sets the current <code>Log</code> implementation used by this class. 058 */ 059 public void setLog(Log log) { 060 this.log = log; 061 } 062 063 // --------------------------------------------------------- Public Methods 064 065 /** 066 * Matches using simple regex algorithm. 067 * 068 * 069 * @param basePattern the standard digester path representing the element 070 * @param regexPattern the regex pattern the path will be tested against 071 * @return true if the given pattern matches the given path 072 */ 073 @Override 074 public boolean match(String basePattern, String regexPattern) { 075 // check for nulls 076 if (basePattern == null || regexPattern == null) { 077 return false; 078 } 079 return match(basePattern, regexPattern, 0, 0); 080 } 081 082 // --------------------------------------------------------- Implementations Methods 083 084 /** 085 * Implementation of regex matching algorithm. 086 * This calls itself recursively. 087 */ 088 private boolean match(String basePattern, String regexPattern, int baseAt, int regexAt) { 089 if (log.isTraceEnabled()) { 090 log.trace("Base: " + basePattern); 091 log.trace("Regex: " + regexPattern); 092 log.trace("Base@" + baseAt); 093 log.trace("Regex@" + regexAt); 094 } 095 096 // check bounds 097 if (regexAt >= regexPattern.length()) { 098 // maybe we've got a match 099 if (baseAt >= basePattern.length()) { 100 // ok! 101 return true; 102 } 103 // run out early 104 return false; 105 106 } else { 107 if (baseAt >= basePattern.length()) { 108 // run out early 109 return false; 110 } 111 } 112 113 // ok both within bounds 114 char regexCurrent = regexPattern.charAt(regexAt); 115 switch (regexCurrent) { 116 case '*': 117 // this is the tricky case 118 // check for terminal 119 if (++regexAt >= regexPattern.length()) { 120 // this matches anything let - so return true 121 return true; 122 } 123 // go through every subsequent apperance of the next character 124 // and so if the rest of the regex matches 125 char nextRegex = regexPattern.charAt(regexAt); 126 if (log.isTraceEnabled()) { 127 log.trace("Searching for next '" + nextRegex + "' char"); 128 } 129 int nextMatch = basePattern.indexOf(nextRegex, baseAt); 130 while (nextMatch != -1) { 131 if (log.isTraceEnabled()) { 132 log.trace("Trying '*' match@" + nextMatch); 133 } 134 if (match(basePattern, regexPattern, nextMatch, regexAt)) { 135 return true; 136 } 137 nextMatch = basePattern.indexOf(nextRegex, nextMatch + 1); 138 } 139 log.trace("No matches found."); 140 return false; 141 142 case '?': 143 // this matches anything 144 return match(basePattern, regexPattern, ++baseAt, ++regexAt); 145 146 default: 147 if (log.isTraceEnabled()) { 148 log.trace("Camparing " + regexCurrent + " to " + basePattern.charAt(baseAt)); 149 } 150 if (regexCurrent == basePattern.charAt(baseAt)) { 151 // still got more to go 152 return match(basePattern, regexPattern, ++baseAt, ++regexAt); 153 } 154 return false; 155 } 156 } 157 }