chore: update allium spec with clearer wording about the embedding model
This commit is contained in:
@@ -213,6 +213,14 @@ invariant VectorCacheInDb {
|
|||||||
-- Enables instant reload without re-embedding
|
-- Enables instant reload without re-embedding
|
||||||
}
|
}
|
||||||
|
|
||||||
|
invariant RealNeuralModel {
|
||||||
|
-- Embeddings MUST be produced by the actual ONNX neural model (multilingual-e5-small),
|
||||||
|
-- not by lexical approximations (TF-IDF, bag-of-words, hash projections).
|
||||||
|
-- Cross-language semantic similarity is a primary requirement:
|
||||||
|
-- posts in different languages about the same topic must produce similar vectors.
|
||||||
|
-- This is only achievable with the trained multilingual transformer model.
|
||||||
|
}
|
||||||
|
|
||||||
invariant ModelCaching {
|
invariant ModelCaching {
|
||||||
-- Model files (~100 MB) downloaded from Hugging Face Hub on first use
|
-- Model files (~100 MB) downloaded from Hugging Face Hub on first use
|
||||||
-- Cached in app data directory, persists across sessions
|
-- Cached in app data directory, persists across sessions
|
||||||
|
|||||||
Reference in New Issue
Block a user