public abstract class AnalysisFactoryTestCase extends ESTestCase { static final Map> KNOWN_TOKENFILTERS = new MapBuilder>() .put("apostrophe") .put("arabicnormalization") .put("arabicstem") .put("asciifolding") .put("bengalinormalization") .put("bengalistem") .put("brazilianstem") .put("bulgarianstem") .put("cjkbigram") .put("cjkwidth") .put("classic") .put("commongrams") .put("commongramsquery") .put("czechstem") .put("decimaldigit") .put("delimitedpayload") .put("dictionarycompoundword") .put("edgengram") .put("elision") .put("englishminimalstem") .put("englishpossessive") .put("finnishlightstem") .put("flattengraph") .put("frenchlightstem") .put("frenchminimalstem") .put("galicianminimalstem") .put("galicianstem") .put("germanlightstem") .put("germanminimalstem") .put("germannormalization") .put("germanstem") .put("greeklowercase") .put("greekstem") .put("hindinormalization") .put("hindistem") .put("hungarianlightstem") .put("hunspellstem") .put("hyphenationcompoundword") .put("indicnormalization") .put("indonesianstem") .put("irishlowercase") .put("italianlightstem") .put("keepword") .put("keywordmarker") .put("kstem") .put("latvianstem") .put("length") .put("limittokencount") .put("lowercase") .put("minhash") .put("ngram") .put("norwegianlightstem") .put("norwegianminimalstem") .put("patterncapturegroup") .put("patternreplace") .put("persiannormalization") .put("porterstem") .put("portugueselightstem") .put("portugueseminimalstem") .put("portuguesestem") .put("reversestring") .put("russianlightstem") .put("scandinavianfolding") .put("scandinaviannormalization") .put("serbiannormalization") .put("shingle") .put("snowballporter") .put("soraninormalization") .put("soranistem") .put("spanishlightstem") .put("standard") .put("stemmeroverride") .put("stop") .put("swedishlightstem") .put("synonym") .put("synonymgraph") .put("trim") .put("truncate") .put("turkishlowercase") .put("type") .put("uppercase") .put("worddelimiter") .put("worddelimitergraph") .put("apostrophe") .put("arabicnormalization") .put("arabicstem") .put("asciifolding") .put("bengalinormalization") .put("bengalistem") .put("brazilianstem") .put("bulgarianstem") .put("cjkbigram") .put("cjkwidth") .put("classic") .put("commongrams") .put("commongramsquery") .put("czechstem") .put("decimaldigit") .put("delimitedpayload") .put("dictionarycompoundword") .put("edgengram") .put("elision") .put("englishminimalstem") .put("englishpossessive") .put("finnishlightstem") .put("flattengraph") .put("frenchlightstem") .put("frenchminimalstem") .put("galicianminimalstem") .put("galicianstem") .put("germanlightstem") .put("germanminimalstem") .put("germannormalization") .put("germanstem") .put("greeklowercase") .put("greekstem") .put("hindinormalization") .put("hindistem") .put("hungarianlightstem") .put("hunspellstem") .put("hyphenationcompoundword") .put("indicnormalization") .put("indonesianstem") .put("irishlowercase") .put("italianlightstem") .put("keepword") .put("keywordmarker") .put("kstem") .put("latvianstem") .put("length") .put("limittokencount") .put("lowercase") .put("minhash") .put("ngram") .put("norwegianlightstem") .put("norwegianminimalstem") .put("patterncapturegroup") .put("patternreplace") .put("persiannormalization") .put("porterstem") .put("portugueselightstem") .put("portugueseminimalstem") .put("portuguesestem") .put("reversestring") .put("russianlightstem") .put("scandinavianfolding") .put("scandinaviannormalization") .put("serbiannormalization") .put("shingle") .put("snowballporter") .put("soraninormalization") .put("soranistem") .put("spanishlightstem") .put("standard") .put("stemmeroverride") .put("stop") .put("swedishlightstem") .put("synonym") .put("synonymgraph") .put("trim") .put("truncate") .put("turkishlowercase") .put("type") .put("uppercase") .put("worddelimiter") .put("worddelimitergraph") .put("apostrophe") .put("arabicnormalization") .put("arabicstem") .put("asciifolding") .put("bengalinormalization") .put("bengalistem") .put("brazilianstem") .put("bulgarianstem") .put("cjkbigram") .put("cjkwidth") .put("classic") .put("commongrams") .put("commongramsquery") .put("czechstem") .put("decimaldigit") .put("delimitedpayload") .put("dictionarycompoundword") .put("edgengram") .put("elision") .put("englishminimalstem") .put("englishpossessive") .put("finnishlightstem") .put("flattengraph") .put("frenchlightstem") .put("frenchminimalstem") .put("galicianminimalstem") .put("galicianstem") .put("germanlightstem") .put("germanminimalstem") .put("germannormalization") .put("germanstem") .put("greeklowercase") .put("greekstem") .put("hindinormalization") .put("hindistem") .put("hungarianlightstem") .put("hunspellstem") .put("hyphenationcompoundword") .put("indicnormalization") .put("indonesianstem") .put("irishlowercase") .put("italianlightstem") .put("keepword") .put("keywordmarker") .put("kstem") .put("latvianstem") .put("length") .put("limittokencount") .put("lowercase") .put("minhash") .put("ngram") .put("norwegianlightstem") .put("norwegianminimalstem") .put("patterncapturegroup") .put("patternreplace") .put("persiannormalization") .put("porterstem") .put("portugueselightstem") .put("portugueseminimalstem") .put("portuguesestem") .put("reversestring") .put("russianlightstem") .put("scandinavianfolding") .put("scandinaviannormalization") .put("serbiannormalization") .put("shingle") .put("snowballporter") .put("soraninormalization") .put("soranistem") .put("spanishlightstem") .put("standard") .put("stemmeroverride") .put("stop") .put("swedishlightstem") .put("synonym") .put("synonymgraph") .put("trim") .put("truncate") .put("turkishlowercase") .put("type") .put("uppercase") .put("worddelimiter") .put("worddelimitergraph") .put("apostrophe") .put("arabicnormalization") .put("arabicstem") .put("asciifolding") .put("bengalinormalization") .put("bengalistem") .put("brazilianstem") .put("bulgarianstem") .put("cjkbigram") .put("cjkwidth") .put("classic") .put("commongrams") .put("commongramsquery") .put("czechstem") .put("decimaldigit") .put("delimitedpayload") .put("dictionarycompoundword") .put("edgengram") .put("elision") .put("englishminimalstem") .put("englishpossessive") .put("finnishlightstem") .put("flattengraph") .put("frenchlightstem") .put("frenchminimalstem") .put("galicianminimalstem") .put("galicianstem") .put("germanlightstem") .put("germanminimalstem") .put("germannormalization") .put("germanstem") .put("greeklowercase") .put("greekstem") .put("hindinormalization") .put("hindistem") .put("hungarianlightstem") .put("hunspellstem") .put("hyphenationcompoundword") .put("indicnormalization") .put("indonesianstem") .put("irishlowercase") .put("italianlightstem") .put("keepword") .put("keywordmarker") .put("kstem") .put("latvianstem") .put("length") .put("limittokencount") .put("lowercase") .put("minhash") .put("ngram") .put("norwegianlightstem") .put("norwegianminimalstem") .put("patterncapturegroup") .put("patternreplace") .put("persiannormalization") .put("porterstem") .put("portugueselightstem") .put("portugueseminimalstem") .put("portuguesestem") .put("reversestring") .put("russianlightstem") .put("scandinavianfolding") .put("scandinaviannormalization") .put("serbiannormalization") .put("shingle") .put("snowballporter") .put("soraninormalization") .put("soranistem") .put("spanishlightstem") .put("standard") .put("stemmeroverride") .put("stop") .put("swedishlightstem") .put("synonym") .put("synonymgraph") .put("trim") .put("truncate") .put("turkishlowercase") .put("type") .put("uppercase") .put("worddelimiter") .put("worddelimitergraph") .put("apostrophe") .put("arabicnormalization") .put("arabicstem") .put("asciifolding") .put("bengalinormalization") .put("bengalistem") .put("brazilianstem") .put("bulgarianstem") .put("cjkbigram") .put("cjkwidth") .put("classic") .put("commongrams") .put("commongramsquery") .put("czechstem") .put("decimaldigit") .put("delimitedpayload") .put("dictionarycompoundword") .put("edgengram") .put("elision") .put("englishminimalstem") .put("englishpossessive") .put("finnishlightstem") .put("flattengraph") .put("frenchlightstem") .put("frenchminimalstem") .put("galicianminimalstem") .put("galicianstem") .put("germanlightstem") .put("germanminimalstem") .put("germannormalization") .put("germanstem") .put("greeklowercase") .put("greekstem") .put("hindinormalization") .put("hindistem") .put("hungarianlightstem") .put("hunspellstem") .put("hyphenationcompoundword") .put("indicnormalization") .put("indonesianstem") .put("irishlowercase") .put("italianlightstem") .put("keepword") .put("keywordmarker") .put("kstem") .put("latvianstem") .put("length") .put("limittokencount") .put("lowercase") .put("minhash") .put("ngram") .put("norwegianlightstem") .put("norwegianminimalstem") .put("patterncapturegroup") .put("patternreplace") .put("persiannormalization") .put("porterstem") .put("portugueselightstem") .put("portugueseminimalstem") .put("portuguesestem") .put("reversestring") .put("russianlightstem") .put("scandinavianfolding") .put("scandinaviannormalization") .put("serbiannormalization") .put("shingle") .put("snowballporter") .put("soraninormalization") .put("soranistem") .put("spanishlightstem") .put("standard") .put("stemmeroverride") .put("stop") .put("swedishlightstem") .put("synonym") .put("synonymgraph") .put("trim") .put("truncate") .put("turkishlowercase") .put("type") .put("uppercase") .put("worddelimiter") .put("worddelimitergraph") .put("apostrophe") .put("arabicnormalization") .put("arabicstem") .put("asciifolding") .put("bengalinormalization") .put("bengalistem") .put("brazilianstem") .put("bulgarianstem") .put("cjkbigram") .put("cjkwidth") .put("classic") .put("commongrams") .put("commongramsquery") .put("czechstem") .put("decimaldigit") .put("delimitedpayload") .put("dictionarycompoundword") .put("edgengram") .put("elision") .put("englishminimalstem") .put("englishpossessive") .put("finnishlightstem") .put("flattengraph") .put("frenchlightstem") .put("frenchminimalstem") .put("galicianminimalstem") .put("galicianstem") .put("germanlightstem") .put("germanminimalstem") .put("germannormalization") .put("germanstem") .put("greeklowercase") .put("greekstem") .put("hindinormalization") .put("hindistem") .put("hungarianlightstem") .put("hunspellstem") .put("hyphenationcompoundword") .put("indicnormalization") .put("indonesianstem") .put("irishlowercase") .put("italianlightstem") .put("keepword") .put("keywordmarker") .put("kstem") .put("latvianstem") .put("length") .put("limittokencount") .put("lowercase") .put("minhash") .put("ngram") .put("norwegianlightstem") .put("norwegianminimalstem") .put("patterncapturegroup") .put("patternreplace") .put("persiannormalization") .put("porterstem") .put("portugueselightstem") .put("portugueseminimalstem") .put("portuguesestem") .put("reversestring") .put("russianlightstem") .put("scandinavianfolding") .put("scandinaviannormalization") .put("serbiannormalization") .put("shingle") .put("snowballporter") .put("soraninormalization") .put("soranistem") .put("spanishlightstem") .put("standard") .put("stemmeroverride") .put("stop") .put("swedishlightstem") .put("synonym") .put("synonymgraph") .put("trim") .put("truncate") .put("turkishlowercase") .put("type") .put("uppercase") .put("worddelimiter") .put("worddelimitergraph") .put("apostrophe") .put("arabicnormalization") .put("arabicstem") .put("asciifolding") .put("bengalinormalization") .put("bengalistem") .put("brazilianstem") .put("bulgarianstem") .put("cjkbigram") .put("cjkwidth") .put("classic") .put("commongrams") .put("commongramsquery") .put("czechstem") .put("decimaldigit") .put("delimitedpayload") .put("dictionarycompoundword") .put("edgengram") .put("elision") .put("englishminimalstem") .put("englishpossessive") .put("finnishlightstem") .put("flattengraph") .put("frenchlightstem") .put("frenchminimalstem") .put("galicianminimalstem") .put("galicianstem") .put("germanlightstem") .put("germanminimalstem") .put("germannormalization") .put("germanstem") .put("greeklowercase") .put("greekstem") .put("hindinormalization") .put("hindistem") .put("hungarianlightstem") .put("hunspellstem") .put("hyphenationcompoundword") .put("indicnormalization") .put("indonesianstem") .put("irishlowercase") .put("italianlightstem") .put("keepword") .put("keywordmarker") .put("kstem") .put("latvianstem") .put("length") .put("limittokencount") .put("lowercase") .put("minhash") .put("ngram") .put("norwegianlightstem") .put("norwegianminimalstem") .put("patterncapturegroup") .put("patternreplace") .put("persiannormalization") .put("porterstem") .put("portugueselightstem") .put("portugueseminimalstem") .put("portuguesestem") .put("reversestring") .put("russianlightstem") .put("scandinavianfolding") .put("scandinaviannormalization") .put("serbiannormalization") .put("shingle") .put("snowballporter") .put("soraninormalization") .put("soranistem") .put("spanishlightstem") .put("standard") .put("stemmeroverride") .put("stop") .put("swedishlightstem") .put("synonym") .put("synonymgraph") .put("trim") .put("truncate") .put("turkishlowercase") .put("type") .put("uppercase") .put("worddelimiter") .put("worddelimitergraph") .put("apostrophe") .put("arabicnormalization") .put("arabicstem") .put("asciifolding") .put("bengalinormalization") .put("bengalistem") .put("brazilianstem") .put("bulgarianstem") .put("cjkbigram") .put("cjkwidth") .put("classic") .put("commongrams") .put("commongramsquery") .put("czechstem") .put("decimaldigit") .put("delimitedpayload") .put("dictionarycompoundword") .put("edgengram") .put("elision") .put("englishminimalstem") .put("englishpossessive") .put("finnishlightstem") .put("flattengraph") .put("frenchlightstem") .put("frenchminimalstem") .put("galicianminimalstem") .put("galicianstem") .put("germanlightstem") .put("germanminimalstem") .put("germannormalization") .put("germanstem") .put("greeklowercase") .put("greekstem") .put("hindinormalization") .put("hindistem") .put("hungarianlightstem") .put("hunspellstem") .put("hyphenationcompoundword") .put("indicnormalization") .put("indonesianstem") .put("irishlowercase") .put("italianlightstem") .put("keepword") .put("keywordmarker") .put("kstem") .put("latvianstem") .put("length") .put("limittokencount") .put("lowercase") .put("minhash") .put("ngram") .put("norwegianlightstem") .put("norwegianminimalstem") .put("patterncapturegroup") .put("patternreplace") .put("persiannormalization") .put("porterstem") .put("portugueselightstem") .put("portugueseminimalstem") .put("portuguesestem") .put("reversestring") .put("russianlightstem") .put("scandinavianfolding") .put("scandinaviannormalization") .put("serbiannormalization") .put("shingle") .put("snowballporter") .put("soraninormalization") .put("soranistem") .put("spanishlightstem") .put("standard") .put("stemmeroverride") .put("stop") .put("swedishlightstem") .put("synonym") .put("synonymgraph") .put("trim") .put("truncate") .put("turkishlowercase") .put("type") .put("uppercase") .put("worddelimiter") .put("worddelimitergraph") .put("apostrophe") .put("arabicnormalization") .put("arabicstem") .put("asciifolding") .put("bengalinormalization") .put("bengalistem") .put("brazilianstem") .put("bulgarianstem") .put("cjkbigram") .put("cjkwidth") .put("classic") .put("commongrams") .put("commongramsquery") .put("czechstem") .put("decimaldigit") .put("delimitedpayload") .put("dictionarycompoundword") .put("edgengram") .put("elision") .put("englishminimalstem") .put("englishpossessive") .put("finnishlightstem") .put("flattengraph") .put("frenchlightstem") .put("frenchminimalstem") .put("galicianminimalstem") .put("galicianstem") .put("germanlightstem") .put("germanminimalstem") .put("germannormalization") .put("germanstem") .put("greeklowercase") .put("greekstem") .put("hindinormalization") .put("hindistem") .put("hungarianlightstem") .put("hunspellstem") .put("hyphenationcompoundword") .put("indicnormalization") .put("indonesianstem") .put("irishlowercase") .put("italianlightstem") .put("keepword") .put("keywordmarker") .put("kstem") .put("latvianstem") .put("length") .put("limittokencount") .put("lowercase") .put("minhash") .put("ngram") .put("norwegianlightstem") .put("norwegianminimalstem") .put("patterncapturegroup") .put("patternreplace") .put("persiannormalization") .put("porterstem") .put("portugueselightstem") .put("portugueseminimalstem") .put("portuguesestem") .put("reversestring") .put("russianlightstem") .put("scandinavianfolding") .put("scandinaviannormalization") .put("serbiannormalization") .put("shingle") .put("snowballporter") .put("soraninormalization") .put("soranistem") .put("spanishlightstem") .put("standard") .put("stemmeroverride") .put("stop") .put("swedishlightstem") .put("synonym") .put("synonymgraph") .put("trim") .put("truncate") .put("turkishlowercase") .put("type") .put("uppercase") .put("worddelimiter") .put("worddelimitergraph") .put("apostrophe") .put("arabicnormalization") .put("arabicstem") .put("asciifolding") .put("bengalinormalization") .put("bengalistem") .put("brazilianstem") .put("bulgarianstem") .put("cjkbigram") .put("cjkwidth") .put("classic") .put("commongrams") .put("commongramsquery") .put("czechstem") .put("decimaldigit") .put("delimitedpayload") .put("dictionarycompoundword") .put("edgengram") .put("elision") .put("englishminimalstem") .put("englishpossessive") .put("finnishlightstem") .put("flattengraph") .put("frenchlightstem") .put("frenchminimalstem") .put("galicianminimalstem") .put("galicianstem") .put("germanlightstem") .put("germanminimalstem") .put("germannormalization") .put("germanstem") .put("greeklowercase") .put("greekstem") .put("hindinormalization") .put("hindistem") .put("hungarianlightstem") .put("hunspellstem") .put("hyphenationcompoundword") .put("indicnormalization") .put("indonesianstem") .put("irishlowercase") .put("italianlightstem") .put("keepword") .put("keywordmarker") .put("kstem") .put("latvianstem") .put("length") .put("limittokencount") .put("lowercase") .put("minhash") .put("ngram") .put("norwegianlightstem") .put("norwegianminimalstem") .put("patterncapturegroup") .put("patternreplace") .put("persiannormalization") .put("porterstem") .put("portugueselightstem") .put("portugueseminimalstem") .put("portuguesestem") .put("reversestring") .put("russianlightstem") .put("scandinavianfolding") .put("scandinaviannormalization") .put("serbiannormalization") .put("shingle") .put("snowballporter") .put("soraninormalization") .put("soranistem") .put("spanishlightstem") .put("standard") .put("stemmeroverride") .put("stop") .put("swedishlightstem") .put("synonym") .put("synonymgraph") .put("trim") .put("truncate") .put("turkishlowercase") .put("type") .put("uppercase") .put("worddelimiter") .put("worddelimitergraph") .immutableMap(); }