optimize: batch embedding and add Qdrant write_consistency_factor parameter (#21776)

Co-authored-by: hobo.l <hobo.l@binance.com>
2025-07-10 10:16:59 +08:00
parent a316766ad7
commit a371390d6c
2 changed files with 20 additions and 2 deletions
--- a/api/core/rag/datasource/vdb/qdrant/qdrant_vector.py
+++ b/api/core/rag/datasource/vdb/qdrant/qdrant_vector.py
@@ -47,6 +47,7 @@ class QdrantConfig(BaseModel):
    grpc_port: int = 6334
    prefer_grpc: bool = False
    replication_factor: int = 1
+    write_consistency_factor: int = 1

    def to_qdrant_params(self):
        if self.endpoint and self.endpoint.startswith("path:"):
@@ -127,6 +128,7 @@ class QdrantVector(BaseVector):
                    hnsw_config=hnsw_config,
                    timeout=int(self._client_config.timeout),
                    replication_factor=self._client_config.replication_factor,
+                    write_consistency_factor=self._client_config.write_consistency_factor,
                )

                # create group_id payload index