JaccardDistance.java

  1. /*
  2.  * Licensed to the Apache Software Foundation (ASF) under one or more
  3.  * contributor license agreements.  See the NOTICE file distributed with
  4.  * this work for additional information regarding copyright ownership.
  5.  * The ASF licenses this file to You under the Apache License, Version 2.0
  6.  * (the "License"); you may not use this file except in compliance with
  7.  * the License.  You may obtain a copy of the License at
  8.  *
  9.  *      http://www.apache.org/licenses/LICENSE-2.0
  10.  *
  11.  * Unless required by applicable law or agreed to in writing, software
  12.  * distributed under the License is distributed on an "AS IS" BASIS,
  13.  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  14.  * See the License for the specific language governing permissions and
  15.  * limitations under the License.
  16.  */
  17. package org.apache.commons.text.similarity;

  18. /**
  19.  * Measures the Jaccard distance of two sets of character sequence. Jaccard
  20.  * distance is the dissimilarity between two sets. Its the complementary of
  21.  * Jaccard similarity.
  22.  *
  23.  * <p>
  24.  * For further explanation about Jaccard Distance, refer
  25.  * https://en.wikipedia.org/wiki/Jaccard_index
  26.  * </p>
  27.  *
  28.  * @since 1.0
  29.  */
  30. public class JaccardDistance implements EditDistance<Double> {

  31.     private final JaccardSimilarity jaccardSimilarity = new JaccardSimilarity();

  32.     /**
  33.      * Calculates Jaccard distance of two set character sequence passed as
  34.      * input. Calculates Jaccard similarity and returns the complement of it.
  35.      *
  36.      * @param left first character sequence
  37.      * @param right second character sequence
  38.      * @return index
  39.      * @throws IllegalArgumentException
  40.      *             if either String input {@code null}
  41.      */
  42.     @Override
  43.     public Double apply(CharSequence left, CharSequence right) {
  44.         if (left == null || right == null) {
  45.             throw new IllegalArgumentException("Input cannot be null");
  46.         }
  47.         return Math.round((1 - jaccardSimilarity.apply(left, right)) * 100d) / 100d;
  48.     }
  49. }