001 /* 002 * Licensed to the Apache Software Foundation (ASF) under one or more 003 * contributor license agreements. See the NOTICE file distributed with 004 * this work for additional information regarding copyright ownership. 005 * The ASF licenses this file to You under the Apache License, Version 2.0 006 * (the "License"); you may not use this file except in compliance with 007 * the License. You may obtain a copy of the License at 008 * 009 * http://www.apache.org/licenses/LICENSE-2.0 010 * 011 * Unless required by applicable law or agreed to in writing, software 012 * distributed under the License is distributed on an "AS IS" BASIS, 013 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 014 * See the License for the specific language governing permissions and 015 * limitations under the License. 016 */ 017 018 package org.apache.commons.codec.language; 019 020 import org.apache.commons.codec.EncoderException; 021 import org.apache.commons.codec.StringEncoderAbstractTest; 022 import org.junit.Test; 023 024 /** 025 * Tests the {@code ColognePhonetic} class. 026 * 027 * <p>Keep this file in UTF-8 encoding for proper Javadoc processing.</p> 028 * 029 */ 030 public class ColognePhoneticTest extends StringEncoderAbstractTest<ColognePhonetic> { 031 032 @Override 033 protected ColognePhonetic createStringEncoder() { 034 return new ColognePhonetic(); 035 } 036 037 @Test 038 public void testAabjoe() throws EncoderException { 039 this.checkEncoding("01", "Aabjoe"); 040 } 041 042 @Test 043 public void testAaclan() throws EncoderException { 044 this.checkEncoding("0856", "Aaclan"); 045 } 046 047 /** 048 * Tests [CODEC-122] 049 * 050 * @throws EncoderException 051 */ 052 @Test 053 public void testAychlmajrForCodec122() throws EncoderException { 054 this.checkEncoding("04567", "Aychlmajr"); 055 } 056 057 @Test 058 public void testEdgeCases() throws EncoderException { 059 final String[][] data = { 060 {"a", "0"}, 061 {"e", "0"}, 062 {"i", "0"}, 063 {"o", "0"}, 064 {"u", "0"}, 065 {"\u00E4", "0"}, // a-umlaut 066 {"\u00F6", "0"}, // o-umlaut 067 {"\u00FC", "0"}, // u-umlaut 068 {"aa", "0"}, 069 {"ha", "0"}, 070 {"h", ""}, 071 {"aha", "0"}, 072 {"b", "1"}, 073 {"p", "1"}, 074 {"ph", "3"}, 075 {"f", "3"}, 076 {"v", "3"}, 077 {"w", "3"}, 078 {"g", "4"}, 079 {"k", "4"}, 080 {"q", "4"}, 081 {"x", "48"}, 082 {"ax", "048"}, 083 {"cx", "48"}, 084 {"l", "5"}, 085 {"cl", "45"}, 086 {"acl", "085"}, 087 {"mn", "6"}, 088 {"r", "7"}}; 089 this.checkEncodings(data); 090 } 091 092 @Test 093 public void testExamples() throws EncoderException { 094 final String[][] data = { 095 {"m\u00DCller", "657"}, // mÜller - why upper case U-umlaut? 096 {"schmidt", "862"}, 097 {"schneider", "8627"}, 098 {"fischer", "387"}, 099 {"weber", "317"}, 100 {"wagner", "3467"}, 101 {"becker", "147"}, 102 {"hoffmann", "0366"}, 103 {"sch\u00C4fer", "837"}, // schÄfer - why upper case A-umlaut ? 104 {"Breschnew", "17863"}, 105 {"Wikipedia", "3412"}, 106 {"peter", "127"}, 107 {"pharma", "376"}, 108 {"m\u00f6nchengladbach", "664645214"}, // mönchengladbach 109 {"deutsch", "28"}, 110 {"deutz", "28"}, 111 {"hamburg", "06174"}, 112 {"hannover", "0637"}, 113 {"christstollen", "478256"}, 114 {"Xanthippe", "48621"}, 115 {"Zacharias", "8478"}, 116 {"Holzbau", "0581"}, 117 {"matsch", "68"}, 118 {"matz", "68"}, 119 {"Arbeitsamt", "071862"}, 120 {"Eberhard", "01772"}, 121 {"Eberhardt", "01772"}, 122 {"heithabu", "021"}}; 123 this.checkEncodings(data); 124 } 125 126 @Test 127 public void testHyphen() throws EncoderException { 128 final String[][] data = {{"bergisch-gladbach", "174845214"}, 129 {"M\u00fcller-L\u00fcdenscheidt", "65752682"}}; // Müller-Lüdenscheidt 130 this.checkEncodings(data); 131 } 132 133 @Test 134 public void testIsEncodeEquals() { 135 final String[][] data = { 136 {"Meyer", "M\u00fcller"}, // Müller 137 {"Meyer", "Mayr"}, 138 {"house", "house"}, 139 {"House", "house"}, 140 {"Haus", "house"}, 141 {"ganz", "Gans"}, 142 {"ganz", "G\u00e4nse"}, // Gänse 143 {"Miyagi", "Miyako"}}; 144 for (final String[] element : data) { 145 this.getStringEncoder().isEncodeEqual(element[1], element[0]); 146 } 147 } 148 149 @Test 150 public void testVariationsMella() throws EncoderException { 151 final String data[] = {"mella", "milah", "moulla", "mellah", "muehle", "mule"}; 152 this.checkEncodingVariations("65", data); 153 } 154 155 @Test 156 public void testVariationsMeyer() throws EncoderException { 157 final String data[] = {"Meier", "Maier", "Mair", "Meyer", "Meyr", "Mejer", "Major"}; 158 this.checkEncodingVariations("67", data); 159 } 160 }