/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

// ASHKENAZIC
//
// Rule table: one rule per line, four double-quoted fields per rule.
// Reading the fields as they are used throughout this file:
//   1. the letter sequence to match,
//   2. a context that must precede it ("" = none, "^" looks like start of name),
//   3. a context that must follow it ("" = none, "$" looks like end of name),
//   4. the replacement; "(a|b|c)" lists alternatives, and a "[language]" suffix
//      tags an alternative with one or more "+"-joined language names.
// NOTE(review): the exact semantics of the contexts and of the language tags are
// defined by the engine that loads this file, not by this file - confirm there.
// NOTE(review): context-specific rules are consistently listed before the general
// rule for the same letters, which suggests that the first matching rule wins;
// the relative order of the rules below should therefore be preserved.

// CONVERTING FEMININE TO MASCULINE
// Name-final feminine endings; all rules in this section are anchored with "$".
"yna" "" "$" "(in[russian]|ina)"
"ina" "" "$" "(in[russian]|ina)"
"liova" "" "$" "(lof[russian]|lef[russian]|lova)"
"lova" "" "$" "(lof[russian]|lef[russian]|lova)"
"ova" "" "$" "(of[russian]|ova)"
"eva" "" "$" "(ef[russian]|eva)"
"aia" "" "$" "(aja|i[russian])"
"aja" "" "$" "(aja|i[russian])"
"aya" "" "$" "(aja|i[russian])"

"lowa" "" "$" "(lova|lof[polish]|l[polish]|el[polish])"
"kowa" "" "$" "(kova|kof[polish]|k[polish]|ek[polish])"
"owa" "" "$" "(ova|of[polish]|)"
"lowna" "" "$" "(lovna|levna|l[polish]|el[polish])"
"kowna" "" "$" "(kovna|k[polish]|ek[polish])"
"owna" "" "$" "(ovna|[polish])"
"lówna" "" "$" "(l|el[polish])" // polish
"kówna" "" "$" "(k|ek[polish])" // polish
"ówna" "" "$" "" // polish

"a" "" "$" "(a|i[polish])"

// CONSONANTS (integrated: German, Polish, Russian, Romanian and English)

"rh" "^" "" "r"
"ssch" "" "" "S"
"chsch" "" "" "xS"
"tsch" "" "" "tS"

"sch" "" "[ei]" "(sk[romanian]|S|StS[russian])" // german
"sch" "" "" "(S|StS[russian])" // german

"ssh" "" "" "S"

"sh" "" "[äöü]" "sh" // german
"sh" "" "[aeiou]" "(S[russian+english]|sh)"
"sh" "" "" "S" // russian+english

"kh" "" "" "(x[russian+english]|kh)"

"chs" "" "" "(ks[german]|xs|tSs[russian+english])"

// French "ch" is currently disabled. The two rules below are the disabled
// variants (they carry an extra S[french] alternative) and are kept for reference only:
// "ch" "" "[ei]" "(x|tS|k[romanian]|S[french])"
// "ch" "" "" "(x|tS[russian+english]|S[french])"

"ch" "" "[ei]" "(x|k[romanian]|tS[russian+english])"
"ch" "" "" "(x|tS[russian+english])"

"ck" "" "" "(k|tsk[polish])"

// "cz" and the "-wicz" family of endings; longer endings are listed before shorter ones.
"czy" "" "" "tSi"
"cze" "" "[bcdgkpstwzż]" "(tSe|tSF)"
"ciewicz" "" "" "(tsevitS|tSevitS)"
"siewicz" "" "" "(sevitS|SevitS)"
"ziewicz" "" "" "(zevitS|ZevitS)"
"riewicz" "" "" "rjevitS"
"diewicz" "" "" "djevitS"
"tiewicz" "" "" "tjevitS"
"iewicz" "" "" "evitS"
"ewicz" "" "" "evitS"
"owicz" "" "" "ovitS"
"icz" "" "" "itS"
"cz" "" "" "tS" // Polish

// "ci" + vowel; the variant followed by a consonant class comes before the general one.
"cia" "" "[bcdgkpstwzż]" "(tSB[polish]|tsB)"
"cia" "" "" "(tSa[polish]|tsa)"
"cią" "" "[bp]" "(tSom[polish]|tsom)"
"cią" "" "" "(tSon[polish]|tson)"
"cię" "" "[bp]" "(tSem[polish]|tsem)"
"cię" "" "" "(tSen[polish]|tsen)"
"cie" "" "[bcdgkpstwzż]" "(tSF[polish]|tsF)"
"cie" "" "" "(tSe[polish]|tse)"
"cio" "" "" "(tSo[polish]|tso)"
"ciu" "" "" "(tSu[polish]|tsu)"

"ci" "" "$" "(tsi[polish]|tSi[polish+romanian]|tS[romanian]|si)"
"ci" "" "" "(tsi[polish]|tSi[polish+romanian]|si)"
"ce" "" "[bcdgkpstwzż]" "(tsF[polish]|tSe[polish+romanian]|se)"
"ce" "" "" "(tSe[polish+romanian]|tse[polish]|se)"
"cy" "" "" "(si|tsi[polish])"

"ssz" "" "" "S" // Polish
"sz" "" "" "S" // Polish; actually could also be Hungarian /s/, disabled here

"ssp" "" "" "(Sp[german]|sp)"
"sp" "" "" "(Sp[german]|sp)"
"sst" "" "" "(St[german]|st)"
"st" "" "" "(St[german]|st)"
"ss" "" "" "s"

// "si" + vowel; same layout as the "ci" + vowel group above.
"sia" "" "[bcdgkpstwzż]" "(SB[polish]|sB[polish]|sja)"
"sia" "" "" "(Sa[polish]|sja)"
"sią" "" "[bp]" "(Som[polish]|som)"
"sią" "" "" "(Son[polish]|son)"
"się" "" "[bp]" "(Sem[polish]|sem)"
"się" "" "" "(Sen[polish]|sen)"
"sie" "" "[bcdgkpstwzż]" "(SF[polish]|sF|zi[german])"
"sie" "" "" "(se|Se[polish]|zi[german])"
"sio" "" "" "(So[polish]|so)"
"siu" "" "" "(Su[polish]|sju)"
"si" "" "" "(Si[polish]|si|zi[german])"
"s" "" "[aeiouäöë]" "(s|z[german])"

"gue" "" "" "ge"
"gui" "" "" "gi"
"guy" "" "" "gi"
"gh" "" "[ei]" "(g[romanian]|gh)"

// Specific name fragments in which a written "g" is rewritten as "h"
// (e.g. gaus -> haus, golts -> holts, gendler -> hendler).
"gauz" "" "$" "haus"
"gaus" "" "$" "haus"
"gol'ts" "" "$" "holts"
"golts" "" "$" "holts"
"gol'tz" "" "$" "holts"
// NOTE(review): unlike its four siblings this rule has no "$" anchor, so it matches
// "goltz" anywhere and appears to make the "^"-anchored "goltz" rule below redundant.
// Possibly a missing "$" - confirm against the reference rule set before changing.
"goltz" "" "" "holts"
"gol'ts" "^" "" "holts"
"golts" "^" "" "holts"
"gol'tz" "^" "" "holts"
"goltz" "^" "" "holts"
"gendler" "" "$" "hendler"
"gejmer" "" "$" "hajmer"
"gejm" "" "$" "hajm"
"geymer" "" "$" "hajmer"
"geym" "" "$" "hajm"
"geimer" "" "$" "hajmer"
"geim" "" "$" "hajm"
"gof" "" "$" "hof"

// Identity rules for name-final "ger", "gen" and "gin".
// NOTE(review): presumably these exist so that the multi-alternative "ge"/"gi"
// rules further down are not applied to these endings - confirm.
"ger" "" "$" "ger"
"gen" "" "$" "gen"
"gin" "" "$" "gin"

"gie" "" "$" "(ge|gi[german]|ji[french])"
"gie" "" "" "ge"
"ge" "[yaeiou]" "" "(gE|xe[spanish]|dZe[english+romanian])"
"gi" "[yaeiou]" "" "(gI|xi[spanish]|dZi[english+romanian])"
"ge" "" "" "(gE|dZe[english+romanian]|hE[russian]|xe[spanish])"
"gi" "" "" "(gI|dZi[english+romanian]|hI[russian]|xi[spanish])"
"gy" "" "[aeouáéóúüöőű]" "(gi|dj[hungarian])"
"gy" "" "" "(gi|d[hungarian])"
"g" "[jyaeiou]" "[aouyei]" "g"
"g" "" "[aouei]" "(g|h[russian])"

"ej" "" "" "(aj|eZ[french+romanian]|ex[spanish])"
// NOTE(review): same pattern and same (empty) contexts as the rule directly above;
// if the first matching rule wins, this rule can never apply - confirm.
"ej" "" "" "aj"

"ly" "" "[au]" "l"
"li" "" "[au]" "l"
"lj" "" "[au]" "l"
"lio" "" "" "(lo|le[russian])"
"lyo" "" "" "(lo|le[russian])"
"ll" "" "" "(l|J[spanish])"

"j" "" "[aoeiuy]" "(j|dZ[english]|x[spanish]|Z[french+romanian])"
"j" "" "" "(j|x[spanish])"

"pf" "" "" "(pf|p|f)"
"ph" "" "" "(ph|f)"

"qu" "" "" "(kv[german]|k)"

// "rz" groups: the variant preceded by "t" is listed before the general one.
"rze" "t" "" "(Se[polish]|re)" // polish
"rze" "" "" "(rze|rtsE[german]|Ze[polish]|re[polish]|rZe[polish])"
"rzy" "t" "" "(Si[polish]|ri)" // polish
"rzy" "" "" "(Zi[polish]|ri[polish]|rZi)"
"rz" "t" "" "(S[polish]|r)" // polish
"rz" "" "" "(rz|rts[german]|Z[polish]|r[polish]|rZ[polish])" // polish

"tz" "" "$" "(ts|tS[english+german])"
"tz" "^" "" "(ts|tS[english+german])"
"tz" "" "" "(ts[english+german+russian]|tz)"

"zh" "" "" "(Z|zh[polish]|tsh[german])"

// "zi" + vowel; same layout as the "ci" and "si" groups above.
"zia" "" "[bcdgkpstwzż]" "(ZB[polish]|zB[polish]|zja)"
"zia" "" "" "(Za[polish]|zja)"
"zią" "" "[bp]" "(Zom[polish]|zom)"
"zią" "" "" "(Zon[polish]|zon)"
"zię" "" "[bp]" "(Zem[polish]|zem)"
"zię" "" "" "(Zen[polish]|zen)"
"zie" "" "[bcdgkpstwzż]" "(ZF[polish]|zF[polish]|ze|tsi[german])"
"zie" "" "" "(ze|Ze[polish]|tsi[german])"
"zio" "" "" "(Zo[polish]|zo)"
"ziu" "" "" "(Zu[polish]|zju)"
"zi" "" "" "(Zi[polish]|zi|tsi[german])"

"thal" "" "$" "tal"
"th" "^" "" "t"
"th" "" "[aeiou]" "(t[german]|th)"
"th" "" "" "t" // german
"vogel" "" "" "(vogel|fogel[german])"
"v" "^" "" "(v|f[german])"

// "h" after a vowel is dropped (empty replacement).
"h" "[aeiouyäöü]" "" "" //german
"h" "" "" "(h|x[romanian+polish])"
// NOTE(review): this "^"-anchored rule follows the unconditional "h" rule above;
// if the first matching rule wins, it is never reached. Reordering would change
// the generated output, so confirm the intended behaviour before touching it.
"h" "^" "" "(h|H[english+german])" // H can be exact "h" or approximate "kh"

// VOWELS
"yi" "^" "" "i"

// Disabled general rule for final "e" (French & English); only the
// final "-ine" case below is active:
//"e" "" "$" "(e|)"
"e" "in" "$" "(e|[french])"

"ii" "" "$" "i" // russian
"iy" "" "$" "i" // russian
"yy" "" "$" "i" // russian
"yi" "" "$" "i" // russian
"yj" "" "$" "i" // russian
"ij" "" "$" "i" // russian

// Identity rules for "aue" and "oue"; listed ahead of the shorter "au"/"ou"/"ue" rules.
"aue" "" "" "aue"
"oue" "" "" "oue"

"au" "" "" "(au|o[french])"
"ou" "" "" "(ou|u[french])"

"ue" "" "" "(Q|uje[russian])"
"ae" "" "" "(Y[german]|aje[russian]|ae)"
"oe" "" "" "(Y[german]|oje[russian]|oe)"
"ee" "" "" "(i[english]|aje[russian]|e)"

"ei" "" "" "aj"
"ey" "" "" "aj"
"eu" "" "" "(aj[german]|oj[german]|eu)"

"i" "[aou]" "" "j"
"y" "[aou]" "" "j"

// NOTE(review): both "ie" rules produce the same replacement, so the
// context-specific one currently makes no difference to the result.
"ie" "" "[bcdgkpstwzż]" "(i[german]|e[polish]|ije[russian]|je)"
"ie" "" "" "(i[german]|e[polish]|ije[russian]|je)"
"ye" "" "" "(je|ije[russian])"

"i" "" "[au]" "j"
"y" "" "[au]" "j"
"io" "" "" "(jo|e[russian])"
"yo" "" "" "(jo|e[russian])"

"ea" "" "" "(ea|ja[romanian])"
"e" "^" "" "(e|je[russian])"
"oo" "" "" "(u[english]|o)"
"uu" "" "" "u"

// LANGUAGE SPECIFIC CHARACTERS
"ć" "" "" "(tS[polish]|ts)" // polish
"ł" "" "" "l" // polish
"ń" "" "" "n" // polish
"ñ" "" "" "(n|nj[spanish])"
"ś" "" "" "(S[polish]|s)" // polish
"ş" "" "" "S" // romanian
"ţ" "" "" "ts" // romanian
"ż" "" "" "Z" // polish
"ź" "" "" "(Z[polish]|z)" // polish

"où" "" "" "u" // french
"ą" "" "[bp]" "om" // polish
"ą" "" "" "on" // polish
"ä" "" "" "(Y|e)" // german
"á" "" "" "a" // hungarian
"ă" "" "" "(e[romanian]|a)" // romanian
"à" "" "" "a" // french
"â" "" "" "a" // french+romanian
"é" "" "" "e"
"è" "" "" "e" // french
"ê" "" "" "e" // french
"ę" "" "[bp]" "em" // polish
"ę" "" "" "en" // polish
"í" "" "" "i"
"î" "" "" "i"
"ö" "" "" "Y"
"ő" "" "" "Y" // hungarian
"ó" "" "" "(u[polish]|o)"
"ű" "" "" "Q"
"ü" "" "" "Q"
"ú" "" "" "u"
// NOTE(review): exact duplicate of the "ű" rule three lines above.
"ű" "" "" "Q" // hungarian

"ß" "" "" "s" // german
// Apostrophes and double quotes are removed (empty replacement).
"'" "" "" ""
"\"" "" "" ""

// Vowels before a consonant class; these carry an extra [polish] alternative
// and are listed before the plain single-letter rules in the next section.
"a" "" "[bcdgkpstwzż]" "(A|B[polish])"
"e" "" "[bcdgkpstwzż]" "(E|F[polish])"
"o" "" "[bcćdgklłmnńrsśtwzźż]" "(O|P[polish])"

// LATIN ALPHABET
// Single-letter rules with no context, one per letter a-z.
"a" "" "" "A"
"b" "" "" "b"
"c" "" "" "(k|ts[polish])"
"d" "" "" "d"
"e" "" "" "E"
"f" "" "" "f"
"g" "" "" "g"
"h" "" "" "h"
"i" "" "" "I"
"j" "" "" "j"
"k" "" "" "k"
"l" "" "" "l"
"m" "" "" "m"
"n" "" "" "n"
"o" "" "" "O"
"p" "" "" "p"
"q" "" "" "k"
"r" "" "" "r"
"s" "" "" "s"
"t" "" "" "t"
"u" "" "" "U"
"v" "" "" "v"
"w" "" "" "v" // English disabled
"x" "" "" "ks"
"y" "" "" "i"
"z" "" "" "(ts[german]|z)"