diff --git a/autorag/vectordb/milvus.py b/autorag/vectordb/milvus.py index b05d1cf80..7a4a1c9f0 100644 --- a/autorag/vectordb/milvus.py +++ b/autorag/vectordb/milvus.py @@ -24,7 +24,7 @@ def __init__( embedding_model: str, collection_name: str, embedding_batch: int = 100, - similarity_metric: str = "l2", + similarity_metric: str = "cosine", index_type: str = "IVF_FLAT", uri: str = "http://localhost:19530", db_name: str = "", diff --git a/docs/source/integration/vectordb/milvus.md b/docs/source/integration/vectordb/milvus.md index ab759df82..b5d5b20e2 100644 --- a/docs/source/integration/vectordb/milvus.md +++ b/docs/source/integration/vectordb/milvus.md @@ -15,6 +15,10 @@ To use the Milvus vector database, you need to configure it in your YAML configu token: ${MILVUS_TOKEN} embedding_batch: 50 similarity_metric: cosine + index_type: IVF_FLAT + params: + nlist: 16384 + ``` Here is a simple example of a YAML configuration file that uses the Milvus vector database and the OpenAI: @@ -29,6 +33,9 @@ vectordb: token: ${MILVUS_TOKEN} embedding_batch: 50 similarity_metric: cosine + index_type: IVF_FLAT + params: + nlist: 16384 node_lines: - node_line_name: retrieve_node_line # Arbitrary node line name nodes: