# THIS FILE IS AUTOMATICALLY GENERATED BY CARGO
#
# When uploading crates to the registry Cargo will automatically
# "normalize" Cargo.toml files for maximal compatibility
# with all versions of Cargo and also rewrite `path` dependencies
# to registry (e.g., crates.io) dependencies.
#
# If you are reading this file be aware that the original Cargo.toml
# will likely look very different (and much more reasonable).
# See Cargo.toml.orig for the original contents.

[package]
edition = "2021"
name = "charabia"
version = "0.8.12"
# NOTE(review): the trailing space inside this entry suggests an `<email>`
# part was stripped at some point; confirm against Cargo.toml.orig.
authors = ["Many "]
exclude = ["dictionaries/txt/thai/words.txt"]
description = "A simple library to detect the language, tokenize the text and normalize the tokens"
documentation = "https://docs.rs/charabia"
readme = "README.md"
keywords = [
    "segmenter",
    "tokenizer",
    "normalize",
    "language",
]
categories = ["text-processing"]
license = "MIT"
repository = "https://github.com/meilisearch/charabia"

# `harness = false` turns off the built-in libtest bench harness for this
# target, so the bench file must provide its own entry point.
[[bench]]
name = "bench"
harness = false

[dependencies.aho-corasick]
version = "1.1.3"

[dependencies.cow-utils]
version = "0.1"

[dependencies.csv]
version = "1.3.0"

[dependencies.deunicode]
version = "1.6.0"

[dependencies.either]
version = "1.13.0"

# Optional: enabled by the `latin-camelcase` and `latin-snakecase` features.
[dependencies.finl_unicode]
version = "1.2.0"
optional = true

[dependencies.fst]
version = "0.4"

# Pinned to an exact version (`=`), not a caret range.
[dependencies.irg-kvariants]
version = "=0.1.1"

# Optional: enabled by the `chinese-segmentation` feature.
[dependencies.jieba-rs]
version = "0.7"
optional = true

# Optional and pinned to an exact version (`=`). Default features are off;
# the `japanese-segmentation-*` and `korean` features turn on the specific
# `lindera/...` features they need.
[dependencies.lindera]
version = "=0.32.2"
optional = true
default-features = false

[dependencies.litemap]
version = "0.7.3"

[dependencies.once_cell]
version = "1.19.0"

# Optional: enabled by the `chinese-normalization-pinyin` feature.
# Default features are off; only `with_tone` is requested.
[dependencies.pinyin]
version = "0.10"
features = ["with_tone"]
optional = true
default-features = false

[dependencies.serde]
version = "1.0"

[dependencies.slice-group-by]
version = "0.3.1"

[dependencies.unicode-normalization]
version = "0.1.23"

# Optional: enabled by the `japanese-transliteration` feature.
[dependencies.wana_kana]
version = "3.0.0"
optional = true

[dependencies.whatlang]
version = "0.16.4"

[dependencies.zerovec]
version = "0.10.4"

[dev-dependencies.criterion]
version = "0.5"
[dev-dependencies.jemallocator]
version = "0.5.4"

[dev-dependencies.quickcheck]
version = "1"

[dev-dependencies.quickcheck_macros]
version = "1"

# Feature flags.
#
# Features declared as `[]` enable no optional dependency and no other
# feature. Features listed below but absent from `default` are opt-in:
# `chinese-normalization-pinyin`, `japanese-segmentation-ipadic`,
# `japanese-transliteration` and `swedish-recomposition`.
[features]
chinese = [
    "chinese-segmentation",
    "chinese-normalization",
]
chinese-normalization = []
chinese-normalization-pinyin = [
    "dep:pinyin",
    "chinese-normalization",
]
chinese-segmentation = ["dep:jieba-rs"]
default = [
    "chinese",
    "hebrew",
    "japanese",
    "thai",
    "korean",
    "greek",
    "latin-camelcase",
    "latin-snakecase",
    "khmer",
    "vietnamese",
]
greek = []
hebrew = []
# `japanese` selects the UniDic-based segmentation feature; the IPADIC
# variant has to be requested explicitly.
japanese = ["japanese-segmentation-unidic"]
japanese-segmentation-ipadic = [
    "lindera/ipadic",
    "lindera/compress",
]
japanese-segmentation-unidic = [
    "lindera/unidic",
    "lindera/compress",
]
japanese-transliteration = ["dep:wana_kana"]
khmer = []
korean = [
    "lindera/ko-dic",
    "lindera/compress",
]
latin-camelcase = ["dep:finl_unicode"]
latin-snakecase = ["dep:finl_unicode"]
swedish-recomposition = []
thai = []
vietnamese = []