001    /* $Id: SimpleRegexMatcher.java 992060 2010-09-02 19:09:47Z simonetripodi $
002     *
003     * Licensed to the Apache Software Foundation (ASF) under one or more
004     * contributor license agreements.  See the NOTICE file distributed with
005     * this work for additional information regarding copyright ownership.
006     * The ASF licenses this file to You under the Apache License, Version 2.0
007     * (the "License"); you may not use this file except in compliance with
008     * the License.  You may obtain a copy of the License at
009     *
010     *      http://www.apache.org/licenses/LICENSE-2.0
011     *
012     * Unless required by applicable law or agreed to in writing, software
013     * distributed under the License is distributed on an "AS IS" BASIS,
014     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
015     * See the License for the specific language governing permissions and
016     * limitations under the License.
017     */
018    
019    package org.apache.commons.digester;
020    
021    import org.apache.commons.logging.Log;
022    import org.apache.commons.logging.LogFactory;
023    
024    /**
025     * <p>Simple regex pattern matching algorithm.</p>
026     * 
027     * <p>This uses just two wildcards:
028     * <ul>
029     *  <li><code>*</code> matches any sequence of none, one or more characters
030     *  <li><code>?</code> matches any one character 
031     * </ul>
032     * Escaping these wildcards is not supported .</p>
033     *
034     * @since 1.5
035     */
036    
037    public class SimpleRegexMatcher extends RegexMatcher {
038        
039        // --------------------------------------------------------- Fields
040        
041        /** Default log (class wide) */
042        private static final Log baseLog = LogFactory.getLog(SimpleRegexMatcher.class);
043        
044        /** Custom log (can be set per object) */
045        private Log log = baseLog;
046        
047        // --------------------------------------------------------- Properties
048        
049        /** 
050         * Gets the <code>Log</code> implementation.
051         */
052        public Log getLog() {
053            return log;
054        }
055        
056        /**
057         * Sets the current <code>Log</code> implementation used by this class.
058         */
059        public void setLog(Log log) {
060            this.log = log;
061        }
062        
063        // --------------------------------------------------------- Public Methods
064        
065        /** 
066         * Matches using simple regex algorithm.
067         * 
068         *
069         * @param basePattern the standard digester path representing the element
070         * @param regexPattern the regex pattern the path will be tested against
071         * @return true if the given pattern matches the given path
072         */
073        @Override
074        public boolean match(String basePattern, String regexPattern) {
075            // check for nulls
076            if (basePattern == null || regexPattern == null) {
077                return false;
078            }
079            return match(basePattern, regexPattern, 0, 0);
080        }
081        
082        // --------------------------------------------------------- Implementations Methods
083        
084        /**
085         * Implementation of regex matching algorithm.
086         * This calls itself recursively.
087         */
088        private boolean match(String basePattern, String regexPattern, int baseAt, int regexAt) {
089            if (log.isTraceEnabled()) {
090                log.trace("Base: " + basePattern);
091                log.trace("Regex: " + regexPattern);
092                log.trace("Base@" + baseAt);
093                log.trace("Regex@" + regexAt);
094            }
095            
096            // check bounds
097            if (regexAt >= regexPattern.length()) {
098                // maybe we've got a match
099                if (baseAt >= basePattern.length()) {
100                    // ok!
101                    return true;
102                }
103                // run out early
104                return false;
105                
106            } else {
107                if (baseAt >= basePattern.length()) {
108                    // run out early
109                    return false;
110                }
111            }
112            
113            // ok both within bounds
114            char regexCurrent = regexPattern.charAt(regexAt);
115            switch (regexCurrent) {
116                case '*':
117                    // this is the tricky case
118                    // check for terminal 
119                    if (++regexAt >= regexPattern.length()) {
120                        // this matches anything let - so return true
121                        return true;
122                    }
123                    // go through every subsequent apperance of the next character
124                    // and so if the rest of the regex matches
125                    char nextRegex = regexPattern.charAt(regexAt);
126                    if (log.isTraceEnabled()) {
127                        log.trace("Searching for next '" + nextRegex + "' char");
128                    }
129                    int nextMatch = basePattern.indexOf(nextRegex, baseAt);
130                    while (nextMatch != -1) {
131                        if (log.isTraceEnabled()) {
132                            log.trace("Trying '*' match@" + nextMatch);
133                        }
134                        if (match(basePattern, regexPattern, nextMatch, regexAt)) {
135                            return true;
136                        }
137                        nextMatch = basePattern.indexOf(nextRegex, nextMatch + 1);
138                    }
139                    log.trace("No matches found.");
140                    return false;
141                    
142                case '?':
143                    // this matches anything
144                    return match(basePattern, regexPattern, ++baseAt, ++regexAt);
145                
146                default:
147                    if (log.isTraceEnabled()) {
148                        log.trace("Camparing " + regexCurrent + " to " + basePattern.charAt(baseAt));
149                    }
150                    if (regexCurrent == basePattern.charAt(baseAt)) {
151                        // still got more to go
152                        return match(basePattern, regexPattern, ++baseAt, ++regexAt);
153                    }
154                    return false;
155            }
156        }
157    }