diff --git a/examples/llm/vdb_upload/vdb_utils.py b/examples/llm/vdb_upload/vdb_utils.py
index d3aed615d7..7740acbc7c 100644
--- a/examples/llm/vdb_upload/vdb_utils.py
+++ b/examples/llm/vdb_upload/vdb_utils.py
@@ -315,14 +315,15 @@ def build_cli_configs(source_type,
     cli_vdb_conf = {
         # Vector db upload has some significant transaction overhead, batch size here should be as large as possible
         'batch_size': 16384,
-        'resource_name': vector_db_resource_name,
         'embedding_size': embedding_size,
         'recreate': True,
+        'resource_name': vector_db_resource_name,
         'resource_schemas': {
             vector_db_resource_name:
                 build_defualt_milvus_config(embedding_size) if (vector_db_service == 'milvus') else None,
         },
         'service': vector_db_service,
+        'truncate_long_strings': True,
         'uri': vector_db_uri,
     }
 
diff --git a/morpheus/service/vdb/milvus_vector_db_service.py b/morpheus/service/vdb/milvus_vector_db_service.py
index b9797ce8f0..1a1fd74be5 100644
--- a/morpheus/service/vdb/milvus_vector_db_service.py
+++ b/morpheus/service/vdb/milvus_vector_db_service.py
@@ -605,13 +605,17 @@ def __init__(self,
                  password: str = "",
                  db_name: str = "",
                  token: str = "",
+                 truncate_long_strings: bool = False,
                  **kwargs: dict[str, typing.Any]):
 
+        self._truncate_long_strings = truncate_long_strings
         self._client = MilvusClient(uri=uri, user=user, password=password, db_name=db_name, token=token, **kwargs)
 
     def load_resource(self, name: str, **kwargs: dict[str, typing.Any]) -> MilvusVectorDBResourceService:
-
-        return MilvusVectorDBResourceService(name=name, client=self._client, **kwargs)
+        return MilvusVectorDBResourceService(name=name,
+                                             client=self._client,
+                                             truncate_long_strings=self._truncate_long_strings,
+                                             **kwargs)
 
     def has_store_object(self, name: str) -> bool:
         """