aboutsummaryrefslogtreecommitdiff
path: root/.venv/lib/python3.12/site-packages/shared/abstractions/embedding.py
blob: 6e27da280ad326b1c7425adce648f62613a8d461 (about) (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
from enum import Enum, auto


class EmbeddingPurpose(str, Enum):
    INDEX = auto()
    QUERY = auto()
    DOCUMENT = auto()


default_embedding_prefixes = {
    "nomic-embed-text-v1.5": {
        EmbeddingPurpose.INDEX: "",
        EmbeddingPurpose.QUERY: "search_query: ",
        EmbeddingPurpose.DOCUMENT: "search_document: ",
    },
    "nomic-embed-text": {
        EmbeddingPurpose.INDEX: "",
        EmbeddingPurpose.QUERY: "search_query: ",
        EmbeddingPurpose.DOCUMENT: "search_document: ",
    },
    "mixedbread-ai/mxbai-embed-large-v1": {
        EmbeddingPurpose.INDEX: "",
        EmbeddingPurpose.QUERY: "Represent this sentence for searching relevant passages: ",
        EmbeddingPurpose.DOCUMENT: "Represent this sentence for searching relevant passages: ",
    },
    "mixedbread-ai/mxbai-embed-large": {
        EmbeddingPurpose.INDEX: "",
        EmbeddingPurpose.QUERY: "Represent this sentence for searching relevant passages: ",
        EmbeddingPurpose.DOCUMENT: "Represent this sentence for searching relevant passages: ",
    },
}