@@ -1,16 +1,17 @@
-from langchain_core.globals import set_verbose, set_debug
-from langchain_ollama import ChatOllama, OllamaEmbeddings
+import logging
+from typing import Optional
+
+import yaml
 from langchain.schema.output_parser import StrOutputParser
-from langchain_mongodb.vectorstores import MongoDBAtlasVectorSearch
-from pymongo import MongoClient
-from langchain_community.document_loaders import PyPDFLoader
-from langchain.text_splitter import RecursiveCharacterTextSplitter
 from langchain.schema.runnable import RunnablePassthrough
+from langchain.text_splitter import RecursiveCharacterTextSplitter
+from langchain_community.document_loaders import PyPDFLoader
 from langchain_community.vectorstores.utils import filter_complex_metadata
+from langchain_core.globals import set_debug, set_verbose
 from langchain_core.prompts import ChatPromptTemplate
-import logging
-import yaml
-
+from langchain_mongodb.vectorstores import MongoDBAtlasVectorSearch
+from langchain_ollama import ChatOllama, OllamaEmbeddings
+from pymongo import MongoClient

 # Enable verbose debugging
 set_debug(True)
@@ -20,11 +21,13 @@
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)

+
 def load_config(config_file: str = "config.yaml"):
     """Load configuration from a YAML file."""
-    with open(config_file, "r") as file:
+    with open(config_file) as file:
         return yaml.safe_load(file)

+
 class ChatPDF:
     """A class designed for PDF ingestion and question answering using RAG with detailed debugging logs."""

@@ -40,29 +43,33 @@ def __init__(self, config_file: str = "config.yaml"):
         mongo_connection_str = config["mongo_connection_str"]
         database_name = config["database_name"]
         collection_name = config["collection_name"]
-
+
         self.model = ChatOllama(model=llm_model)
         self.embeddings = OllamaEmbeddings(model=embedding_model)
-        self.text_splitter = RecursiveCharacterTextSplitter(chunk_size=1024, chunk_overlap=100)
+        self.text_splitter = RecursiveCharacterTextSplitter(
+            chunk_size=1024, chunk_overlap=100
+        )
         self.prompt = ChatPromptTemplate.from_template(
             """
             You are a helpful assistant answering questions based on the uploaded document and the conversation.
-
+
             Conversation History:
             {conversation_history}
-
+
             Context from Documents:
             {context}
-
+
             Question:
             {question}
-
+
             Provide a concise, accurate answer (preferably within three sentences), ensuring it directly addresses the question.
             """
         )
-
+
         # Setup MongoDB connection
-        self.client = MongoClient(mongo_connection_str)
+        self.client = MongoClient(
+            mongo_connection_str, appname="devrel.showcase.local_rag_pdf_app"
+        )
         self.collection = self.client[database_name][collection_name]

         # Verbose connection check
@@ -74,7 +81,7 @@ def __init__(self, config_file: str = "config.yaml"):
             collection=self.collection,
             embedding=self.embeddings,
             index_name="vector_index",
-            relevance_score_fn="cosine"
+            relevance_score_fn="cosine",
         )

         # Create vector search index on the collection
@@ -107,7 +114,13 @@ def upload_and_index_pdf(self, pdf_file_path: str):
         self.vector_store.add_documents(documents=chunks)
         logger.info("Document embeddings stored successfully in MongoDB Atlas.")

-    def query_with_context(self, query: str, conversation_history: list = None, k: int = 5, score_threshold: float = 0.2):
+    def query_with_context(
+        self,
+        query: str,
+        conversation_history: Optional[list] = None,
+        k: int = 5,
+        score_threshold: float = 0.2,
+    ):
         """
         Answer a query using the RAG pipeline with verbose debugging and conversation history.

@@ -132,7 +145,9 @@ def query_with_context(self, query: str, conversation_history: list = None, k: i
         # Generate and log query embeddings
         query_embedding = self.embeddings.embed_query(query)
         logger.info(f"User Query: {query}")
-        logger.debug(f"Query Embedding (sample values): {query_embedding[:10]}... [Total Length: {len(query_embedding)}]")
+        logger.debug(
+            f"Query Embedding (sample values): {query_embedding[:10]}... [Total Length: {len(query_embedding)}]"
+        )

         logger.info(f"Retrieving context for query: {query}")
         retrieved_docs = self.retriever.invoke(query)
@@ -147,17 +162,19 @@ def query_with_context(self, query: str, conversation_history: list = None, k: i

         # Format the input for the LLM, including conversation history
         formatted_input = {
-            "conversation_history": "\n".join(conversation_history) if conversation_history else "",
+            "conversation_history": (
+                "\n".join(conversation_history) if conversation_history else ""
+            ),
             "context": "\n\n".join(doc.page_content for doc in retrieved_docs),
             "question": query,
         }

         # Build the RAG chain
         chain = (
             RunnablePassthrough()  # Passes the input as-is
-            | self.prompt # Formats the input for the LLM
-            | self.model # Queries the LLM
-            | StrOutputParser() # Parses the LLM's output
+            | self.prompt  # Formats the input for the LLM
+            | self.model  # Queries the LLM
+            | StrOutputParser()  # Parses the LLM's output
         )

         logger.info("Generating response using the LLM.")
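For anyone who wants to exercise the refactored class end to end, below is a minimal, hypothetical driver script. It assumes the code in this diff is saved as chat_pdf.py, that a local Ollama server has the named models pulled, and that the Atlas connection string is valid; the model names, database/collection names, and file paths are placeholders, not values taken from this commit.

import yaml

from chat_pdf import ChatPDF  # assumed module name for the code in this diff

# Placeholder values -- swap in models actually pulled into Ollama and a
# real Atlas connection string before running.
config = {
    "llm_model": "llama3",
    "embedding_model": "nomic-embed-text",
    "mongo_connection_str": "mongodb+srv://<user>:<password>@<cluster>/",
    "database_name": "rag_db",
    "collection_name": "pdf_chunks",
}

# Write the config in the shape load_config() reads back with yaml.safe_load().
with open("config.yaml", "w") as file:
    yaml.safe_dump(config, file)

chat = ChatPDF(config_file="config.yaml")
chat.upload_and_index_pdf("example.pdf")  # any local PDF path

# The chain ends in StrOutputParser, so the answer is assumed to come back
# as a plain string.
answer = chat.query_with_context(
    "What is the document about?", conversation_history=[]
)
print(answer)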
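The chain assembled in the last hunk is ordinary LCEL composition: each pipe (|) feeds one runnable's output into the next. Here is a standalone sketch of the same pattern that runs with nothing but a local Ollama server, no MongoDB required; the model name is again a placeholder.

from langchain.schema.output_parser import StrOutputParser
from langchain.schema.runnable import RunnablePassthrough
from langchain_core.prompts import ChatPromptTemplate
from langchain_ollama import ChatOllama

prompt = ChatPromptTemplate.from_template(
    "Answer using only this context:\n{context}\n\nQuestion: {question}"
)
chain = (
    RunnablePassthrough()  # passes the input dict through unchanged
    | prompt  # fills the {context} and {question} placeholders
    | ChatOllama(model="llama3")  # placeholder model name
    | StrOutputParser()  # extracts the reply text as a str
)

print(chain.invoke({"context": "The sky is blue.", "question": "What color is the sky?"}))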