CharRange.java

  1. /*
  2.  * Licensed to the Apache Software Foundation (ASF) under one or more
  3.  * contributor license agreements.  See the NOTICE file distributed with
  4.  * this work for additional information regarding copyright ownership.
  5.  * The ASF licenses this file to You under the Apache License, Version 2.0
  6.  * (the "License"); you may not use this file except in compliance with
  7.  * the License.  You may obtain a copy of the License at
  8.  *
  9.  *      http://www.apache.org/licenses/LICENSE-2.0
  10.  *
  11.  * Unless required by applicable law or agreed to in writing, software
  12.  * distributed under the License is distributed on an "AS IS" BASIS,
  13.  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  14.  * See the License for the specific language governing permissions and
  15.  * limitations under the License.
  16.  */
  17. package org.apache.commons.lang3;

  18. import java.io.Serializable;
  19. import java.util.Iterator;
  20. import java.util.NoSuchElementException;
  21. import java.util.Objects;

  22. /**
  23.  * A contiguous range of characters, optionally negated.
  24.  *
  25.  * <p>Instances are immutable.</p>
  26.  *
  27.  * <p>#ThreadSafe#</p>
  28.  * @since 1.0
  29.  */
  30. // TODO: This is no longer public and will be removed later as CharSet is moved
  31. // to depend on Range.
  32. final class CharRange implements Iterable<Character>, Serializable {

  33.     /**
  34.      * Character {@link Iterator}.
  35.      * <p>#NotThreadSafe#</p>
  36.      */
  37.     private static final class CharacterIterator implements Iterator<Character> {
  38.         /** The current character */
  39.         private char current;

  40.         private final CharRange range;
  41.         private boolean hasNext;

  42.         /**
  43.          * Constructs a new iterator for the character range.
  44.          *
  45.          * @param r The character range
  46.          */
  47.         private CharacterIterator(final CharRange r) {
  48.             range = r;
  49.             hasNext = true;

  50.             if (range.negated) {
  51.                 if (range.start == 0) {
  52.                     if (range.end == Character.MAX_VALUE) {
  53.                         // This range is an empty set
  54.                         hasNext = false;
  55.                     } else {
  56.                         current = (char) (range.end + 1);
  57.                     }
  58.                 } else {
  59.                     current = 0;
  60.                 }
  61.             } else {
  62.                 current = range.start;
  63.             }
  64.         }

  65.         /**
  66.          * Has the iterator not reached the end character yet?
  67.          *
  68.          * @return {@code true} if the iterator has yet to reach the character date
  69.          */
  70.         @Override
  71.         public boolean hasNext() {
  72.             return hasNext;
  73.         }

  74.         /**
  75.          * Returns the next character in the iteration
  76.          *
  77.          * @return {@link Character} for the next character
  78.          */
  79.         @Override
  80.         public Character next() {
  81.             if (!hasNext) {
  82.                 throw new NoSuchElementException();
  83.             }
  84.             final char cur = current;
  85.             prepareNext();
  86.             return Character.valueOf(cur);
  87.         }

  88.         /**
  89.          * Prepares the next character in the range.
  90.          */
  91.         private void prepareNext() {
  92.             if (range.negated) {
  93.                 if (current == Character.MAX_VALUE) {
  94.                     hasNext = false;
  95.                 } else if (current + 1 == range.start) {
  96.                     if (range.end == Character.MAX_VALUE) {
  97.                         hasNext = false;
  98.                     } else {
  99.                         current = (char) (range.end + 1);
  100.                     }
  101.                 } else {
  102.                     current = (char) (current + 1);
  103.                 }
  104.             } else if (current < range.end) {
  105.                 current = (char) (current + 1);
  106.             } else {
  107.                 hasNext = false;
  108.             }
  109.         }

  110.         /**
  111.          * Always throws UnsupportedOperationException.
  112.          *
  113.          * @throws UnsupportedOperationException Always thrown.
  114.          * @see java.util.Iterator#remove()
  115.          */
  116.         @Override
  117.         public void remove() {
  118.             throw new UnsupportedOperationException();
  119.         }
  120.     }

  121.     /**
  122.      * Required for serialization support. Lang version 2.0.
  123.      *
  124.      * @see java.io.Serializable
  125.      */
  126.     private static final long serialVersionUID = 8270183163158333422L;

  127.     /** Empty array. */
  128.     static final CharRange[] EMPTY_ARRAY = {};

  129.     /**
  130.      * Constructs a {@link CharRange} over a single character.
  131.      *
  132.      * @param ch  only character in this range
  133.      * @return the new CharRange object
  134.      * @since 2.5
  135.      */
  136.     public static CharRange is(final char ch) {
  137.         return new CharRange(ch, ch, false);
  138.     }

  139.     /**
  140.      * Constructs a {@link CharRange} over a set of characters.
  141.      *
  142.      * <p>If start and end are in the wrong order, they are reversed.
  143.      * Thus {@code a-e} is the same as {@code e-a}.</p>
  144.      *
  145.      * @param start  first character, inclusive, in this range
  146.      * @param end  last character, inclusive, in this range
  147.      * @return the new CharRange object
  148.      * @since 2.5
  149.      */
  150.     public static CharRange isIn(final char start, final char end) {
  151.         return new CharRange(start, end, false);
  152.     }

  153.     /**
  154.      * Constructs a negated {@link CharRange} over a single character.
  155.      *
  156.      * <p>A negated range includes everything except that defined by the
  157.      * single character.</p>
  158.      *
  159.      * @param ch  only character in this range
  160.      * @return the new CharRange object
  161.      * @since 2.5
  162.      */
  163.     public static CharRange isNot(final char ch) {
  164.         return new CharRange(ch, ch, true);
  165.     }

  166.     /**
  167.      * Constructs a negated {@link CharRange} over a set of characters.
  168.      *
  169.      * <p>A negated range includes everything except that defined by the
  170.      * start and end characters.</p>
  171.      *
  172.      * <p>If start and end are in the wrong order, they are reversed.
  173.      * Thus {@code a-e} is the same as {@code e-a}.</p>
  174.      *
  175.      * @param start  first character, inclusive, in this range
  176.      * @param end  last character, inclusive, in this range
  177.      * @return the new CharRange object
  178.      * @since 2.5
  179.      */
  180.     public static CharRange isNotIn(final char start, final char end) {
  181.         return new CharRange(start, end, true);
  182.     }

  183.     /** The first character, inclusive, in the range. */
  184.     private final char start;

  185.     /** The last character, inclusive, in the range. */
  186.     private final char end;

  187.     /** True if the range is everything except the characters specified. */
  188.     private final boolean negated;

  189.     /** Cached toString. */
  190.     private transient String iToString;

  191.     /**
  192.      * Constructs a {@link CharRange} over a set of characters,
  193.      * optionally negating the range.
  194.      *
  195.      * <p>A negated range includes everything except that defined by the
  196.      * start and end characters.</p>
  197.      *
  198.      * <p>If start and end are in the wrong order, they are reversed.
  199.      * Thus {@code a-e} is the same as {@code e-a}.</p>
  200.      *
  201.      * @param start  first character, inclusive, in this range
  202.      * @param end  last character, inclusive, in this range
  203.      * @param negated  true to express everything except the range
  204.      */
  205.     private CharRange(char start, char end, final boolean negated) {
  206.         if (start > end) {
  207.             final char temp = start;
  208.             start = end;
  209.             end = temp;
  210.         }

  211.         this.start = start;
  212.         this.end = end;
  213.         this.negated = negated;
  214.     }

  215.     // Contains
  216.     /**
  217.      * Is the character specified contained in this range.
  218.      *
  219.      * @param ch  the character to check
  220.      * @return {@code true} if this range contains the input character
  221.      */
  222.     public boolean contains(final char ch) {
  223.         return (ch >= start && ch <= end) != negated;
  224.     }

  225.     /**
  226.      * Are all the characters of the passed in range contained in
  227.      * this range.
  228.      *
  229.      * @param range  the range to check against
  230.      * @return {@code true} if this range entirely contains the input range
  231.      * @throws NullPointerException if {@code null} input
  232.      */
  233.     public boolean contains(final CharRange range) {
  234.         Objects.requireNonNull(range, "range");
  235.         if (negated) {
  236.             if (range.negated) {
  237.                 return start >= range.start && end <= range.end;
  238.             }
  239.             return range.end < start || range.start > end;
  240.         }
  241.         if (range.negated) {
  242.             return start == 0 && end == Character.MAX_VALUE;
  243.         }
  244.         return start <= range.start && end >= range.end;
  245.     }

  246.     // Basics
  247.     /**
  248.      * Compares two CharRange objects, returning true if they represent
  249.      * exactly the same range of characters defined in the same way.
  250.      *
  251.      * @param obj  the object to compare to
  252.      * @return true if equal
  253.      */
  254.     @Override
  255.     public boolean equals(final Object obj) {
  256.         if (obj == this) {
  257.             return true;
  258.         }
  259.         if (!(obj instanceof CharRange)) {
  260.             return false;
  261.         }
  262.         final CharRange other = (CharRange) obj;
  263.         return start == other.start && end == other.end && negated == other.negated;
  264.     }

  265.     /**
  266.      * Gets the end character for this character range.
  267.      *
  268.      * @return the end char (inclusive)
  269.      */
  270.     public char getEnd() {
  271.         return this.end;
  272.     }

  273.     // Accessors
  274.     /**
  275.      * Gets the start character for this character range.
  276.      *
  277.      * @return the start char (inclusive)
  278.      */
  279.     public char getStart() {
  280.         return this.start;
  281.     }

  282.     /**
  283.      * Gets a hashCode compatible with the equals method.
  284.      *
  285.      * @return a suitable hashCode
  286.      */
  287.     @Override
  288.     public int hashCode() {
  289.         return 83 + start + 7 * end + (negated ? 1 : 0);
  290.     }

  291.     /**
  292.      * Is this {@link CharRange} negated.
  293.      *
  294.      * <p>A negated range includes everything except that defined by the
  295.      * start and end characters.</p>
  296.      *
  297.      * @return {@code true} if negated
  298.      */
  299.     public boolean isNegated() {
  300.         return negated;
  301.     }

  302.     /**
  303.      * Returns an iterator which can be used to walk through the characters described by this range.
  304.      *
  305.      * <p>#NotThreadSafe# the iterator is not thread-safe</p>
  306.      * @return an iterator to the chars represented by this range
  307.      * @since 2.5
  308.      */
  309.     @Override
  310.     public Iterator<Character> iterator() {
  311.         return new CharacterIterator(this);
  312.     }

  313.     /**
  314.      * Gets a string representation of the character range.
  315.      *
  316.      * @return string representation of this range
  317.      */
  318.     @Override
  319.     public String toString() {
  320.         if (iToString == null) {
  321.             final StringBuilder buf = new StringBuilder(4);
  322.             if (isNegated()) {
  323.                 buf.append('^');
  324.             }
  325.             buf.append(start);
  326.             if (start != end) {
  327.                 buf.append('-');
  328.                 buf.append(end);
  329.             }
  330.             iToString = buf.toString();
  331.         }
  332.         return iToString;
  333.     }
  334. }