mongodb-js
diff --git a/.vscode/launch.json b/.vscode/launch.json
Lines changed: 7 additions & 0 deletions
diff --git a/README.md b/README.md
Lines changed: 0 additions & 1 deletion
diff --git a/package.json b/package.json
Lines changed: 1 addition & 1 deletion
diff --git a/src/tools/args.ts b/src/tools/args.ts
Lines changed: 1 addition & 0 deletions
diff --git a/src/tools/mongodb/create/createIndex.ts b/src/tools/mongodb/create/createIndex.ts
Lines changed: 152 additions & 61 deletions
diff --git a/src/tools/mongodb/read/aggregate.ts b/src/tools/mongodb/read/aggregate.ts
Lines changed: 7 additions & 3 deletions
diff --git a/tests/accuracy/aggregate.test.ts b/tests/accuracy/aggregate.test.ts
Lines changed: 23 additions & 0 deletions
@@ -4,6 +4,13 @@
   // For more information, visit: https://go.microsoft.com/fwlink/?linkid=830387
   "version": "0.2.0",
   "configurations": [
+    {
+      "name": "Attach by Process ID",
+      "processId": "${command:PickProcess}",
+      "request": "attach",
+      "skipFiles": ["<node_internals>/**"],
+      "type": "node"
+    },
     {
       "type": "node",
       "request": "launch",
 
@@ -669,7 +669,6 @@ npx -y mongodb-mcp-server@latest --logPath=/path/to/logs --readOnly --indexCheck
       "args": [
         "-y",
         "mongodb-mcp-server",
-        "--connectionString",
         "mongodb+srv://username:password@cluster.mongodb.net/myDatabase",
         "--readOnly"
       ]
 
@@ -44,7 +44,7 @@
     "dist"
   ],
   "scripts": {
-    "start": "node dist/index.js --transport http --loggers stderr mcp",
+    "start": "node dist/index.js --transport http --loggers stderr mcp --previewFeatures vectorSearch",
     "start:stdio": "node dist/index.js --transport stdio --loggers stderr mcp",
     "prepare": "husky && pnpm run build",
     "build:clean": "rm -rf dist",
 
@@ -18,6 +18,7 @@ export const ALLOWED_CLUSTER_NAME_CHARACTERS_ERROR =
 const ALLOWED_PROJECT_NAME_CHARACTERS_REGEX = /^[a-zA-Z0-9\s()@&+:._',-]+$/;
 export const ALLOWED_PROJECT_NAME_CHARACTERS_ERROR =
     "Project names can't be longer than 64 characters and can only contain letters, numbers, spaces, and the following symbols: ( ) @ & + : . _ - ' ,";
+
 export const CommonArgs = {
     string: (): ZodString => z.string().regex(NO_UNICODE_REGEX, NO_UNICODE_ERROR),
 
 
@@ -7,62 +7,129 @@ import { quantizationEnum } from "../../../common/search/vectorSearchEmbeddingsM
 import { similarityValues } from "../../../common/schemas.js";
 
 export class CreateIndexTool extends MongoDBToolBase {
-    private vectorSearchIndexDefinition = z.object({
-        type: z.literal("vectorSearch"),
-        fields: z
-            .array(
-                z.discriminatedUnion("type", [
-                    z
-                        .object({
-                            type: z.literal("filter"),
-                            path: z
-                                .string()
-                                .describe(
-                                    "Name of the field to index. For nested fields, use dot notation to specify path to embedded fields"
-                                ),
-                        })
-                        .strict()
-                        .describe("Definition for a field that will be used for pre-filtering results."),
-                    z
-                        .object({
-                            type: z.literal("vector"),
-                            path: z
-                                .string()
-                                .describe(
-                                    "Name of the field to index. For nested fields, use dot notation to specify path to embedded fields"
-                                ),
-                            numDimensions: z
-                                .number()
-                                .min(1)
-                                .max(8192)
-                                .default(this.config.vectorSearchDimensions)
-                                .describe(
-                                    "Number of vector dimensions that MongoDB Vector Search enforces at index-time and query-time"
-                                ),
-                            similarity: z
-                                .enum(similarityValues)
-                                .default(this.config.vectorSearchSimilarityFunction)
-                                .describe(
-                                    "Vector similarity function to use to search for top K-nearest neighbors. You can set this field only for vector-type fields."
-                                ),
-                            quantization: quantizationEnum
-                                .default("none")
+    private vectorSearchIndexDefinition = z
+        .object({
+            type: z.literal("vectorSearch"),
+            fields: z
+                .array(
+                    z.discriminatedUnion("type", [
+                        z
+                            .object({
+                                type: z.literal("filter"),
+                                path: z
+                                    .string()
+                                    .describe(
+                                        "Name of the field to index. For nested fields, use dot notation to specify path to embedded fields"
+                                    ),
+                            })
+                            .strict()
+                            .describe("Definition for a field that will be used for pre-filtering results."),
+                        z
+                            .object({
+                                type: z.literal("vector"),
+                                path: z
+                                    .string()
+                                    .describe(
+                                        "Name of the field to index. For nested fields, use dot notation to specify path to embedded fields"
+                                    ),
+                                numDimensions: z
+                                    .number()
+                                    .min(1)
+                                    .max(8192)
+                                    .default(this.config.vectorSearchDimensions)
+                                    .describe(
+                                        "Number of vector dimensions that MongoDB Vector Search enforces at index-time and query-time"
+                                    ),
+                                similarity: z
+                                    .enum(similarityValues)
+                                    .default(this.config.vectorSearchSimilarityFunction)
+                                    .describe(
+                                        "Vector similarity function to use to search for top K-nearest neighbors. You can set this field only for vector-type fields."
+                                    ),
+                                quantization: quantizationEnum
+                                    .default("none")
+                                    .describe(
+                                        "Type of automatic vector quantization for your vectors. Use this setting only if your embeddings are float or double vectors."
+                                    ),
+                            })
+                            .strict()
+                            .describe("Definition for a field that contains vector embeddings."),
+                    ])
+                )
+                .nonempty()
+                .refine((fields) => fields.some((f) => f.type === "vector"), {
+                    message: "At least one vector field must be defined",
+                })
+                .describe(
+                    "Definitions for the vector and filter fields to index, one definition per document. You must specify `vector` for fields that contain vector embeddings and `filter` for additional fields to filter on. At least one vector-type field definition is required."
+                ),
+        })
+        .describe("Definition for a Vector Search index.");
+
+    private atlasSearchIndexDefinition = z
+        .object({
+            type: z.literal("search"),
+            analyzer: z
+                .string()
+                .optional()
+                .default("lucene.standard")
+                .describe(
+                    "The analyzer to use for the index. Can be one of the built-in lucene analyzers (`lucene.standard`, `lucene.simple`, `lucene.whitespace`, `lucene.keyword`), a language-specific analyzer, such as `lucene.cjk` or `lucene.czech`, or a custom analyzer defined in the Atlas UI."
+                ),
+            mappings: z
+                .object({
+                    dynamic: z
+                        .boolean()
+                        .optional()
+                        .default(false)
+                        .describe(
+                            "Enables or disables dynamic mapping of fields for this index. If set to true, Atlas Search recursively indexes all dynamically indexable fields. If set to false, you must specify individual fields to index using mappings.fields."
+                        ),
+                    fields: z
+                        .record(
+                            z.string().describe("The field name"),
+                            z
+                                .object({
+                                    type: z
+                                        .enum([
+                                            "autocomplete",
+                                            "boolean",
+                                            "date",
+                                            "document",
+                                            "embeddedDocuments",
+                                            "geo",
+                                            "number",
+                                            "objectId",
+                                            "string",
+                                            "token",
+                                            "uuid",
+                                        ])
+                                        .describe("The field type"),
+                                })
+                                .passthrough()
                                 .describe(
-                                    "Type of automatic vector quantization for your vectors. Use this setting only if your embeddings are float or double vectors."
-                                ),
-                        })
-                        .strict()
-                        .describe("Definition for a field that contains vector embeddings."),
-                ])
-            )
-            .nonempty()
-            .refine((fields) => fields.some((f) => f.type === "vector"), {
-                message: "At least one vector field must be defined",
-            })
-            .describe(
-                "Definitions for the vector and filter fields to index, one definition per document. You must specify `vector` for fields that contain vector embeddings and `filter` for additional fields to filter on. At least one vector-type field definition is required."
-            ),
-    });
+                                    "The field index definition. It must contain the field type, as well as any additional options for that field type."
+                                )
+                        )
+                        .optional()
+                        .describe("The field mapping definitions. If `dynamic` is set to `false`, this is required."),
+                })
+                .refine((data) => data.dynamic !== !!(data.fields && Object.keys(data.fields).length > 0), {
+                    message:
+                        "Either `dynamic` must be `true` and `fields` empty or `dynamic` must be `false` and at least one field must be defined in `fields`",
+                })
+                .describe(
+                    "Document describing the index to create. Either `dynamic` must be `true` and `fields` empty or `dynamic` must be `false` and at least one field must be defined in the `fields` document."
+                ),
+            numPartitions: z
+                .union([z.literal("1"), z.literal("2"), z.literal("4")])
+                .default("1")
+                .transform((value): number => Number.parseInt(value))
+                .describe(
+                    "Specifies the number of sub-indexes to create if the document count exceeds two billion. If omitted, defaults to 1."
+                ),
+        })
+        .describe("Definition for an Atlas Search (lexical) index.");
 
     public name = "create-index";
     protected description = "Create an index for a collection";
@@ -72,15 +139,19 @@ export class CreateIndexTool extends MongoDBToolBase {
         definition: z
             .array(
                 z.discriminatedUnion("type", [
-                    z.object({
-                        type: z.literal("classic"),
-                        keys: z.object({}).catchall(z.custom<IndexDirection>()).describe("The index definition"),
-                    }),
-                    ...(this.isFeatureEnabled("search") ? [this.vectorSearchIndexDefinition] : []),
+                    z
+                        .object({
+                            type: z.literal("classic"),
+                            keys: z.object({}).catchall(z.custom<IndexDirection>()).describe("The index definition"),
+                        })
+                        .describe("Definition for a MongoDB index (e.g. ascending/descending/geospatial)."),
+                    ...(this.isFeatureEnabled("search")
+                        ? [this.vectorSearchIndexDefinition, this.atlasSearchIndexDefinition]
+                        : []),
                 ])
             )
             .describe(
-                `The index definition. Use 'classic' for standard indexes${this.isFeatureEnabled("search") ? " and 'vectorSearch' for vector search indexes" : ""}.`
+                `The index definition. Use 'classic' for standard indexes${this.isFeatureEnabled("search") ? ", 'vectorSearch' for vector search indexes, and 'search' for Atlas Search (lexical) indexes" : ""}.`
             ),
     };
 
@@ -130,6 +201,26 @@ export class CreateIndexTool extends MongoDBToolBase {
                     this.session.vectorSearchEmbeddingsManager.cleanupEmbeddingsForNamespace({ database, collection });
                 }
 
+                break;
+            case "search":
+                {
+                    await this.ensureSearchIsSupported();
+                    indexes = await provider.createSearchIndexes(database, collection, [
+                        {
+                            name,
+                            definition: {
+                                mappings: definition.mappings,
+                                analyzer: definition.analyzer,
+                                numPartitions: definition.numPartitions,
+                            },
+                            type: "search",
+                        },
+                    ]);
+
+                    responseClarification =
+                        " Since this is a search index, it may take a while for the index to build. Use the `collection-indexes` tool to check the index status.";
+                }
+
                 break;
         }
 
 
@@ -20,7 +20,8 @@ import {
 
 const pipelineDescriptionWithVectorSearch = `\
 An array of aggregation stages to execute.
-\`$vectorSearch\` **MUST** be the first stage of the pipeline, or the first stage of a \`$unionWith\` subpipeline.
+If the user has asked for a vector search, \`$vectorSearch\` **MUST** be the first stage of the pipeline, or the first stage of a \`$unionWith\` subpipeline.
+If the user has asked for lexical/Atlas search, use \`$search\` instead of \`$text\`.
 ### Usage Rules for \`$vectorSearch\`
 - **Unset embeddings:**
   Unless the user explicitly requests the embeddings, add an \`$unset\` stage **at the end of the pipeline** to remove the embedding field and avoid context limits. **The $unset stage in this situation is mandatory**.
@@ -29,9 +30,12 @@ If the user requests additional filtering, include filters in \`$vectorSearch.fi
     NEVER include fields in $vectorSearch.filter that are not part of the vector index.
 - **Post-filtering:**
     For all remaining filters, add a $match stage after $vectorSearch.
-### Note to LLM
 - If unsure which fields are filterable, use the collection-indexes tool to determine valid prefilter fields.
-- If no requested filters are valid prefilters, omit the filter key from $vectorSearch.\
+- If no requested filters are valid prefilters, omit the filter key from $vectorSearch.
+
+### Usage Rules for \`$search\`
+- Include the index name, unless you know for a fact there's a default index. If unsure, use the collection-indexes tool to determine the index name.
+- The \`$search\` stage supports multiple operators, such as 'autocomplete', 'text', 'geoWithin', and others. Choose the appropriate operator based on the user's query. If unsure of the exact syntax, consult the MongoDB Atlas Search documentation, which can be found here: https://www.mongodb.com/docs/atlas/atlas-search/operators-and-collectors/
 `;
 
 const genericPipelineDescription = "An array of aggregation stages to execute.";
 
@@ -421,4 +421,27 @@ describeAccuracyTests([
             },
         },
     },
+    {
+        prompt: "Run a $search query on mflix.movies to find all movies that mention 'space travel' in the plot or title. Use the default search index.",
+        expectedToolCalls: [
+            {
+                toolName: "aggregate",
+                parameters: {
+                    database: "mflix",
+                    collection: "movies",
+                    pipeline: [
+                        {
+                            $search: {
+                                index: Matcher.anyOf(Matcher.undefined, Matcher.value("default")),
+                                text: {
+                                    query: "space travel",
+                                    path: ["plot", "title"],
+                                },
+                            },
+                        },
+                    ],
+                },
+            },
+        ],
+    },
 ]);
Original file line number	Diff line number	Diff line change
`@@ -669,7 +669,6 @@ npx -y mongodb-mcp-server@latest --logPath=/path/to/logs --readOnly --indexCheck`
`669`	`669`	`"args": [`
`670`	`670`	`"-y",`
`671`	`671`	`"mongodb-mcp-server",`
`672`		`- "--connectionString",`
`673`	`672`	`"mongodb+srv://username:password@cluster.mongodb.net/myDatabase",`
`674`	`673`	`"--readOnly"`
`675`	`674`	`]`