# MeiliSearch/crates/milli/Cargo.toml

[package]
name = "milli"
version.workspace = true
authors.workspace = true
# The edition is set explicitly for this crate; the workspace-inherited form
# is kept below, disabled.
edition = "2021"
# edition.workspace = true
homepage.workspace = true
license.workspace = true
publish = false
readme.workspace = true
description.workspace = true

[dependencies]
big_s = "1.0.2"
bimap = { version = "0.6.3", features = ["serde"] }
bincode = "1.3.3"
bstr = "1.11.3"
bytemuck = { version = "1.21.0", features = ["extern_crate_alloc"] }
byteorder = "1.5.0"
# Default features are disabled here; individual tokenizations are re-enabled
# through this crate's own `[features]` table.
charabia = { version = "0.9.2", default-features = false }
concat-arrays = "0.1.2"
crossbeam-channel = "0.5.14"
deserr = "0.6.3"
either = { version = "1.13.0", features = ["serde"] }
flatten-serde-json = { path = "../flatten-serde-json" }
fst = "0.4.7"
fxhash = "0.2.1"
geoutils = "0.5.1"
grenad = { version = "0.5.0", default-features = false, features = ["rayon", "tempfile"] }
heed = { version = "0.20.5", default-features = false, features = [
    "serde-json",
    "serde-bincode",
    "read-txn-no-tls",
] }
indexmap = { version = "2.7.0", features = ["serde"] }
json-depth-checker = { path = "../json-depth-checker" }
levenshtein_automata = { version = "0.2.1", features = ["fst_automaton"] }
memchr = "2.7.4"
memmap2 = "0.9.5"
obkv = "0.3.0"
once_cell = "1.20.2"
ordered-float = "4.6.0"
rayon = "1.10.0"
roaring = { version = "0.10.10", features = ["serde"] }
rstar = { version = "0.12.2", features = ["serde"] }
serde = { version = "1.0.217", features = ["derive"] }
serde_json = { version = "1.0.135", features = ["preserve_order", "raw_value"] }
slice-group-by = "0.3.1"
smallstr = { version = "0.3.0", features = ["serde"] }
smallvec = "1.13.2"
smartstring = "1.0.1"
tempfile = "3.15.0"
thiserror = "2.0.9"
time = { version = "0.3.37", features = [
    "serde-well-known",
    "formatting",
    "parsing",
    "macros",
] }
uuid = { version = "1.11.0", features = ["v4"] }
filter-parser = { path = "../filter-parser" }
# documents words self-join
itertools = "0.14.0"
csv = "1.3.1"
candle-core = { version = "0.8.2" }
candle-transformers = { version = "0.8.2" }
candle-nn = { version = "0.8.2" }
# Git dependency pinned to the `v0.15.2` tag.
tokenizers = { git = "https://github.com/huggingface/tokenizers.git", tag = "v0.15.2", version = "0.15.2", default-features = false, features = [
    "onig",
] }
# Git dependency tracking the `rust_tls` branch.
hf-hub = { git = "https://github.com/dureuill/hf-hub.git", branch = "rust_tls", default-features = false, features = [
    "online",
] }
tiktoken-rs = "0.6.0"
liquid = "0.26.9"
# Git dependency pinned to an exact commit.
rhai = { git = "https://github.com/rhaiscript/rhai", rev = "ef3df63121d27aacd838f366f2b83fd65f20a1e4", features = [
    "serde",
    "no_module",
    "no_custom_syntax",
    "no_time",
    "sync",
] }
arroy = "0.5.0"
rand = "0.8.5"
tracing = "0.1.41"
ureq = { version = "2.12.1", features = ["json"] }
url = "2.5.4"
rayon-par-bridge = "0.1.0"
hashbrown = "0.15.2"
bumpalo = "3.16.0"
bumparaw-collections = "0.1.4"
thread_local = "1.1.8"
allocator-api2 = "0.2.21"
rustc-hash = "2.1.0"
uell = "0.1.0"
enum-iterator = "2.1.0"
# NOTE(review): no `rev`, `tag` or `branch` is given for this git dependency,
# so the commit actually used is whatever the lockfile records; consider pinning.
bbqueue = { git = "https://github.com/meilisearch/bbqueue" }
flume = { version = "0.11.1", default-features = false }
utoipa = { version = "5.3.1", features = ["non_strict_integers", "preserve_order", "uuid", "time", "openapi_extensions"] }

[dev-dependencies]
mimalloc = { version = "0.1.43", default-features = false }
# fixed version due to format breakages in v1.40
insta = "=1.39.0"
maplit = "1.0.2"
md5 = "0.7.0"
meili-snap = { path = "../meili-snap" }
# Same version as the regular `rand` dependency, with `small_rng` enabled in addition.
rand = { version = "0.8.5", features = ["small_rng"] }

[features]
# Forwards to charabia's `default` feature set.
all-tokenizations = [
    "charabia/default",
]

# Use POSIX semaphores instead of SysV semaphores in LMDB
# For more information on this feature, see heed's Cargo.toml
lmdb-posix-sem = ["heed/posix-sem"]

# allow chinese specialized tokenization
chinese = ["charabia/chinese"]
# Enables `chinese` plus charabia's `chinese-normalization-pinyin` feature.
chinese-pinyin = ["chinese", "charabia/chinese-normalization-pinyin"]

# allow hebrew specialized tokenization
hebrew = ["charabia/hebrew"]

# allow japanese specialized tokenization
japanese = ["charabia/japanese"]
japanese-transliteration = ["charabia/japanese-transliteration"]

# allow korean specialized tokenization
korean = ["charabia/korean"]

# allow thai specialized tokenization
thai = ["charabia/thai"]

# allow greek specialized tokenization
greek = ["charabia/greek"]

# allow khmer specialized tokenization
khmer = ["charabia/khmer"]

# allow vietnamese specialized tokenization
vietnamese = ["charabia/vietnamese"]

# allow german specialized tokenization
german = ["charabia/german-segmentation"]

# force swedish character recomposition
swedish-recomposition = ["charabia/swedish-recomposition"]

# allow turkish specialized tokenization
turkish = ["charabia/turkish"]

# allow CUDA support, see <https://github.com/meilisearch/meilisearch/issues/4306>
cuda = ["candle-core/cuda"]