From f2c4094e614397edeb80bd0e95394b8ecfc00d47 Mon Sep 17 00:00:00 2001 From: Vishakha Gupta-Cledat Date: Mon, 25 Nov 2024 01:49:02 -0800 Subject: [PATCH 1/6] Introduce ApertureDB information --- docs/tools/vdb_table/data/aperturedb.json | 78 +++++++++++------------ 1 file changed, 39 insertions(+), 39 deletions(-) diff --git a/docs/tools/vdb_table/data/aperturedb.json b/docs/tools/vdb_table/data/aperturedb.json index 8dea1b22..68581e21 100644 --- a/docs/tools/vdb_table/data/aperturedb.json +++ b/docs/tools/vdb_table/data/aperturedb.json @@ -9,42 +9,42 @@ "slug": "aperturedb" }, "oss": { - "support": "", - "source_url": "", - "comment": "" + "support": "community", + "source_url": "https://hub.docker.com/r/aperturedata/aperturedb-community", + "comment": "ApertureDB community is a great way to test all the database features, locally." }, "license": { - "value": "", + "value": "Proprietary", "source_url": "", "comment": "" }, "dev_languages": { "value": [ - "" + "C++" ], "source_url": "", "comment": "" }, - "vector_launch_year": 0, + "vector_launch_year": 2021, "metadata_filter": { - "support": "", - "source_url": "", - "comment": "" + "support": "full", + "source_url": "https://docs.aperturedata.io/concepts/Schema", + "comment": "Complete graph database support alongside vector search" }, "hybrid_search": { - "support": "", + "support": "full", "source_url": "", - "comment": "" + "comment": "Blending graph filtering with vector search. 
Easy to introduce search algorithms" }, "facets": { - "support": "", + "support": "full", "source_url": "", "comment": "" }, "geo_search": { - "support": "", + "support": "partial", "source_url": "", - "comment": "" + "comment": "Coordinates can be represented in metadata or as embeddings" }, "multi_vec": { "support": "", @@ -52,7 +52,7 @@ "comment": "" }, "sparse_vectors": { - "support": "", + "support": "full", "source_url": "", "comment": "" }, @@ -67,14 +67,14 @@ "comment": "" }, "embeddings_text": { - "support": "", + "support": "full", "source_url": "", "comment": "" }, "embeddings_image": { - "support": "", + "support": "full", "source_url": "", - "comment": "" + "comment": "Supports multimodal embeddings in general including video" }, "embeddings_structured": { "support": "", @@ -82,34 +82,34 @@ "comment": "" }, "rag": { - "support": "", + "support": "full", "source_url": "", "comment": "" }, "recsys": { - "support": "", + "support": "full", "source_url": "", "comment": "" }, "langchain": { - "support": "", + "support": "full", "source_url": "", "comment": "" }, "llamaindex": { - "support": "", + "support": "full", "source_url": "", - "comment": "" + "comment": "Yet to contribute upstream" }, "managed_cloud": { - "support": "", + "support": "full", "source_url": "", - "comment": "" + "comment": "VPC options available as well" }, "pricing": { - "value": "", - "source_url": "", - "comment": "" + "value": "full", + "source_url": "http://aperturedata.io/pricing", + "comment": "Offers free trial" }, "in_process": { "support": "none", @@ -117,7 +117,7 @@ "comment": "" }, "multi_tenancy": { - "support": "", + "support": "full", "source_url": "", "comment": "" }, @@ -127,33 +127,33 @@ "comment": "" }, "ephemeral": { - "support": "", + "support": "full", "source_url": "", "comment": "" }, "sharding": { - "support": "", + "support": "full", "source_url": "", "comment": "" }, "doc_size": { "bytes": 0, - "unlimited": false, - "source_url": "", - "comment": "" + 
"unlimited": true, + "source_url": "https://docs.aperturedata.io/administration/Distributed%20aperturedb", + "comment": "Multimodal data stored in a horizontally scalable ApertureDB deployment, not limited in count of objects." }, "vector_dims": { "value": 0, "unlimited": true, "source_url": "", - "comment": "" + "comment": "Unlimited. Commonly tested 4096 dims" }, "index_types": { "value": [ - "HNSW" + "HNSW", "FLAT", "IVF" ], - "source_url": "", - "comment": "" + "source_url": "https://docs.aperturedata.io/query_language/reference/descriptor_commands/desc_set_commands/AddDescriptorSet", + "comment": "New indexes introduced as needed. Multiple distance metrics supported." }, "github_stars": { "value": 0, @@ -185,4 +185,4 @@ "comment": "", "value_90_days": 0 } -} \ No newline at end of file +} From 2c311e6d30830db91ad39b34d868a844a3583ce1 Mon Sep 17 00:00:00 2001 From: Vishakha Gupta-Cledat Date: Thu, 12 Dec 2024 17:26:19 -0800 Subject: [PATCH 2/6] Introduce source urls --- docs/tools/vdb_table/data/aperturedb.json | 68 +++++++++++------------ 1 file changed, 34 insertions(+), 34 deletions(-) diff --git a/docs/tools/vdb_table/data/aperturedb.json b/docs/tools/vdb_table/data/aperturedb.json index cf149c00..434c3186 100644 --- a/docs/tools/vdb_table/data/aperturedb.json +++ b/docs/tools/vdb_table/data/aperturedb.json @@ -15,14 +15,14 @@ }, "license": { "value": "Proprietary", - "source_url": "", - "comment": "" + "source_url": "https://github.com/aperture-data", + "comment": "ApertureDB code is proprietary but we have open source clients, dataset, and applications repositories." }, "dev_languages": { "value": [ - "C++" + "c++" ], - "source_url": "", + "source_url": "https://github.com/aperture-data", "comment": "" }, "vector_launch_year": 2021, @@ -33,27 +33,27 @@ }, "hybrid_search": { "support": "full", - "source_url": "", - "comment": "Blending graph filtering with vector search. 
Easy to introduce search algorithms" + "source_url": "https://docs.aperturedata.io/python_sdk/object_wrappers/Descriptors", + "comment": "Blending graph filtering with vector search. Easy to introduce search algorithms. You can search across multiple embedding sets as well (collections)" }, "facets": { "support": "full", - "source_url": "", + "source_url": "https://docs.aperturedata.io/query_language/Reference/shared_command_parameters/constraints", "comment": "" }, "geo_search": { "support": "partial", - "source_url": "", + "source_url": "https://docs.aperturedata.io/HowToGuides/start/Embeddings", "comment": "Coordinates can be represented in metadata or as embeddings" }, "multi_vec": { - "support": "", - "source_url": "", - "comment": "" + "support": "full", + "source_url": "https://docs.aperturedata.io/HowToGuides/Applications/similarity_search#all-of-the-above-and-some-more-can-be-done-by-executing-this-through-adb-cli", + "comment": "You can attach multiple embeddings per source of data for multimodal data types in different embeddings collections or within the same (regions of interest or full data embeddings)." }, "sparse_vectors": { "support": "full", - "source_url": "", + "source_url": "https://docs.aperturedata.io/query_language/Reference/descriptor_commands/desc_set_commands/AddDescriptorSet", "comment": "" }, "bm25": { @@ -68,43 +68,43 @@ }, "embeddings_text": { "support": "full", - "source_url": "", - "comment": "" + "source_url": "https://docs.aperturedata.io/HowToGuides/Applications/semantic_search/website_ingest", + "comment": "We use text embeddings in ApertureDB vector store for our documentation chatbot." }, "embeddings_image": { "support": "full", - "source_url": "", - "comment": "Supports multimodal embeddings in general including video" + "source_url": "https://docs.aperturedata.io/HowToGuides/Advanced/Image%20Similarity%20Search", + "comment": "Supports multimodal embeddings in general including for videos." 
}, "embeddings_structured": { - "support": "", - "source_url": "", - "comment": "" + "support": "partial", + "source_url": "https://docs.aperturedata.io/query_language/Reference/descriptor_commands/desc_commands/AddDescriptor", + "comment": "ApertureDB vector store can store embeddings from any source but we don't generate them ourselves." }, "rag": { "support": "full", - "source_url": "", - "comment": "" + "source_url": "https://docs.aperturedata.io/category/chatbot-with-langchain-and-aperturedb", + "comment": "You can build hybrid-RAG with our graph-vector search." }, "recsys": { - "support": "full", - "source_url": "", - "comment": "" + "support": "partial", + "source_url": "https://docs.aperturedata.io/HowToGuides/Applications/similarity_search", + "comment": "Recommendations can be built using our KNN and metadata search support." }, "langchain": { "support": "full", - "source_url": "", + "source_url": "https://docs.aperturedata.io/Integrations/langchain_howto", "comment": "" }, "llamaindex": { "support": "full", - "source_url": "", - "comment": "Yet to contribute upstream" + "source_url": "https://github.com/aperture-data/llama_index", + "comment": "Yet to contribute upstream but deployed with customer" }, "managed_cloud": { "support": "full", - "source_url": "", - "comment": "VPC options available as well" + "source_url": "https://cloud.aperturedata.io/", + "comment": "VPC options and community edition available as well" }, "pricing": { "value": "full", @@ -119,7 +119,7 @@ "multi_tenancy": { "support": "full", "source_url": "", - "comment": "" + "comment": "Not documented externally." }, "disk_index": { "support": "", @@ -129,12 +129,12 @@ "ephemeral": { "support": "full", "source_url": "", - "comment": "" + "comment": "Not documented externally." }, "sharding": { "support": "full", "source_url": "", - "comment": "" + "comment": "Not documented externally." 
}, "doc_size": { "bytes": 0, @@ -145,8 +145,8 @@ "vector_dims": { "value": 0, "unlimited": true, - "source_url": "", - "comment": "Unlimited. Commonly tested 4096 dims" + "source_url": "https://docs.aperturedata.io/query_language/reference/descriptor_commands/desc_set_commands/AddDescriptorSet", + "comment": "Unlimited. Currently tested up to 4096 dims" }, "index_types": { "value": [ From 2a1aca2dcfbd88c87e609e3146ee36741f44e43a Mon Sep 17 00:00:00 2001 From: Vishakha Gupta-Cledat Date: Thu, 12 Dec 2024 23:42:52 -0800 Subject: [PATCH 3/6] Fix oss value to match allowed --- docs/tools/vdb_table/data/aperturedb.json | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/docs/tools/vdb_table/data/aperturedb.json b/docs/tools/vdb_table/data/aperturedb.json index 8665e68f..b800712c 100644 --- a/docs/tools/vdb_table/data/aperturedb.json +++ b/docs/tools/vdb_table/data/aperturedb.json @@ -9,9 +9,9 @@ "slug": "aperturedb" }, "oss": { - "support": "community", + "support": "partial", "source_url": "https://hub.docker.com/r/aperturedata/aperturedb-community", - "comment": "ApertureDB community is a great way to test all the database features, locally." + "comment": "ApertureDB community edition is free and a great way to test all the database features, locally." 
}, "license": { "value": "Proprietary", From 2ecefe8010b1c1885dd43492a343236a3ab20e04 Mon Sep 17 00:00:00 2001 From: Vishakha Gupta-Cledat <24485122+vishakha041@users.noreply.github.com> Date: Thu, 19 Dec 2024 12:42:29 -0800 Subject: [PATCH 4/6] Update aperturedb.json for review comments --- docs/tools/vdb_table/data/aperturedb.json | 66 +++++++++++------------ 1 file changed, 33 insertions(+), 33 deletions(-) diff --git a/docs/tools/vdb_table/data/aperturedb.json b/docs/tools/vdb_table/data/aperturedb.json index b800712c..0d059231 100644 --- a/docs/tools/vdb_table/data/aperturedb.json +++ b/docs/tools/vdb_table/data/aperturedb.json @@ -32,28 +32,28 @@ "comment": "Complete graph database support alongside vector search" }, "hybrid_search": { - "support": "full", - "source_url": "https://docs.aperturedata.io/python_sdk/object_wrappers/Descriptors", - "comment": "Blending graph filtering with vector search. Easy to introduce search algorithms. You can search across multiple embedding sets as well (collections)" + "support": "", + "source_url": "", + "comment": "" }, "facets": { "support": "full", - "source_url": "https://docs.aperturedata.io/query_language/Reference/shared_command_parameters/constraints", - "comment": "" + "source_url": "https://docs.aperturedata.io/query_language/Reference/shared_command_parameters/results", + "comment": "Results can be aggregated on property values" }, "geo_search": { - "support": "partial", - "source_url": "https://docs.aperturedata.io/HowToGuides/start/Embeddings", - "comment": "Coordinates can be represented in metadata or as embeddings" + "support": "", + "source_url": "", + "comment": "" }, "multi_vec": { - "support": "full", + "support": "partial", "source_url": "https://docs.aperturedata.io/HowToGuides/Applications/similarity_search#all-of-the-above-and-some-more-can-be-done-by-executing-this-through-adb-cli", "comment": "You can attach multiple embeddings per source of data for multimodal data types in different embeddings 
collections or within the same (regions of interest or full data embeddings)." }, "sparse_vectors": { - "support": "full", - "source_url": "https://docs.aperturedata.io/query_language/Reference/descriptor_commands/desc_set_commands/AddDescriptorSet", + "support": "", + "source_url": "", "comment": "" }, "bm25": { @@ -68,28 +68,28 @@ }, "embeddings_text": { "support": "full", - "source_url": "https://docs.aperturedata.io/HowToGuides/Applications/semantic_search/website_ingest", - "comment": "We use text embeddings in ApertureDB vector store for our documentation chatbot." + "source_url": "https://docs.aperturedata.io/HowToGuides/Ingestion/Updates#transformations-while-loading", + "comment": "You can plug in user-defined or off-the-shelf text embedding models when adding text blobs in the form of new generators" }, "embeddings_image": { "support": "full", - "source_url": "https://docs.aperturedata.io/HowToGuides/Advanced/Image%20Similarity%20Search", - "comment": "Supports multimodal embeddings in general including for videos." + "source_url": "https://docs.aperturedata.io/HowToGuides/Ingestion/Updates#transformations-while-loading", + "comment": "You can plug in user-defined or off-the-shelf image embedding models when adding images to introduce any number of embeddings per image, in different collections" }, "embeddings_structured": { - "support": "partial", - "source_url": "https://docs.aperturedata.io/query_language/Reference/descriptor_commands/desc_commands/AddDescriptor", - "comment": "ApertureDB vector store can store embeddings from any source but we don't generate them ourselves." }, "rag": { - "support": "full", - "source_url": "https://docs.aperturedata.io/category/chatbot-with-langchain-and-aperturedb", - "comment": "You can build hybrid-RAG with our graph-vector search." 
+ "support": "", + "source_url": "", + "comment": "" }, "recsys": { - "support": "partial", - "source_url": "https://docs.aperturedata.io/HowToGuides/Applications/similarity_search", - "comment": "Recommendations can be built using our KNN and metadata search support." + "support": "", + "source_url": "", + "comment": "" }, "langchain": { "support": "full", @@ -97,7 +97,7 @@ "comment": "" }, "llamaindex": { - "support": "full", + "support": "partial", "source_url": "https://github.com/aperture-data/llama_index", "comment": "Yet to contribute upstream but deployed with customer" }, @@ -107,9 +107,9 @@ "comment": "VPC options and community edition available as well" }, "pricing": { - "value": "full", + "value": "Instance-based hourly (cloud) or annual (VPC) pricing with free trial", "source_url": "http://aperturedata.io/pricing", - "comment": "Offers free trial" + "comment": "Priced generally by number of database instances, support level, and resource tier. Free trial and cloud pricing are on the website. Custom pricing for VPC deployments." }, "in_process": { "support": "none", @@ -117,9 +117,9 @@ "comment": "" }, "multi_tenancy": { - "support": "full", + "support": "", "source_url": "", - "comment": "Not documented externally." + "comment": "" }, "disk_index": { "support": "", @@ -127,20 +127,20 @@ "comment": "" }, "ephemeral": { - "support": "full", + "support": "partial", "source_url": "", "comment": "Not documented externally." }, "sharding": { - "support": "full", + "support": "partial", "source_url": "", "comment": "Not documented externally." }, "doc_size": { "bytes": 0, "unlimited": true, - "source_url": "https://docs.aperturedata.io/administration/Distributed%20aperturedb", - "comment": "Multimodal data stored in a horizontally scalable ApertureDB deployment, not limited in count of objects." 
+ "source_url": "https://docs.aperturedata.io/administration/Configuring%20ApertureDB", + "comment": "You can store large or small files but need to change message size for adding or querying files larger than 256MB. For very large files like GBs of video, it will require optimizations to send over network or would be slow." }, "vector_dims": { "value": 0, From 9bee296d16118d78dab22782edb92999f557e71d Mon Sep 17 00:00:00 2001 From: svonava Date: Thu, 19 Dec 2024 16:22:55 -0800 Subject: [PATCH 5/6] Update docs/tools/vdb_table/data/aperturedb.json Co-authored-by: Prashanth Rao <35005448+prrao87@users.noreply.github.com> --- docs/tools/vdb_table/data/aperturedb.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/tools/vdb_table/data/aperturedb.json b/docs/tools/vdb_table/data/aperturedb.json index a30d9cac..6241836e 100644 --- a/docs/tools/vdb_table/data/aperturedb.json +++ b/docs/tools/vdb_table/data/aperturedb.json @@ -152,7 +152,7 @@ "value": [ "HNSW", "FLAT", "IVF" ], - "source_url": "https://docs.aperturedata.io/query_language/reference/descriptor_commands/desc_set_commands/AddDescriptorSet", + "source_url": "https://docs.aperturedata.io/query_language/Reference/descriptor_commands/desc_set_commands/AddDescriptorSet#details", "comment": "New indexes introduced as needed. Multiple distance metrics supported." 
}, "github_stars": { From 81621604bef238acaf1e8e816a1c1ebc34be85c9 Mon Sep 17 00:00:00 2001 From: svonava Date: Thu, 19 Dec 2024 16:23:01 -0800 Subject: [PATCH 6/6] Update docs/tools/vdb_table/data/aperturedb.json Co-authored-by: Prashanth Rao <35005448+prrao87@users.noreply.github.com> --- docs/tools/vdb_table/data/aperturedb.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/tools/vdb_table/data/aperturedb.json b/docs/tools/vdb_table/data/aperturedb.json index 6241836e..cd133c91 100644 --- a/docs/tools/vdb_table/data/aperturedb.json +++ b/docs/tools/vdb_table/data/aperturedb.json @@ -140,7 +140,7 @@ "bytes": 0, "unlimited": true, "source_url": "https://docs.aperturedata.io/administration/Configuring%20ApertureDB", - "comment": "You can store large or small files but need to change message size for adding or querying files larger than 256MB. For very large files like GBs of video, it will require optimizations to send over network or would be slow." + "comment": "You can store large or small files but need to change the `max_connection_message_size_mb` for adding or querying files larger than 256MB. Very large files, such as multi-gigabyte videos, require transfer optimizations or will be slow to send over the network." }, "vector_dims": { "value": 0,