Merge pull request #158 from AlpinDale/embeddings

feat: add embeddings support via Infinity-emb
This commit is contained in:
Brian Dashore 2024-07-31 20:33:12 -04:00 committed by GitHub
commit 1bf062559d
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
14 changed files with 443 additions and 11 deletions

View file

@@ -201,3 +201,19 @@ model:
#loras:
#- name: lora1
# scaling: 1.0
# Options for embedding models and loading.
# NOTE: Embeddings require the "extras" feature to be installed.
# Install it via "pip install .[extras]"
embeddings:
  # Overrides the directory to look for embedding models (default: models)
  embedding_model_dir: models

  # An initial embedding model to load on the infinity backend (default: None)
  # Written as an explicit null so the "no value" intent is unambiguous.
  embedding_model_name: null

  # Device to load embedding models on (default: cpu)
  # Possible values: cpu, auto, cuda
  # NOTE: It's recommended to load embedding models on the CPU.
  # If you'd like to load on an AMD GPU, set this value to "cuda" as well.
  embeddings_device: cpu