Azure · ajtiwari07 · Feb 3, 2026 · Feb 3, 2026 · Feb 3, 2026 · Feb 3, 2026
@@ -770,6 +770,195 @@
               "default": 4
             }
           }
+        },
+        "embeddings": {
+          "type": "object",
+          "description": "Configuration for the text embedding/vectorization service. Supports the OpenAI and Azure OpenAI providers.",
+          "additionalProperties": false,
+          "properties": {
+            "enabled": {
+              "type": "boolean",
+              "description": "Whether the embedding service is enabled. Defaults to true.",
+              "default": true
+            },
+            "provider": {
+              "type": "string",
+              "description": "The embedding provider type.",
+              "enum": ["azure-openai", "openai"]
+            },
+            "base-url": {
+              "type": "string",
+              "description": "The provider base URL. For Azure OpenAI, use the Azure resource endpoint. For OpenAI, use https://api.openai.com."
+            },
+            "api-key": {
+              "type": "string",
+              "description": "The API key for authentication. Supports environment variable substitution with @env('VAR_NAME')."
+            },
+            "model": {
+              "type": "string",
+              "description": "The model or deployment name. Required for Azure OpenAI (deployment name). For OpenAI, defaults to 'text-embedding-3-small' if not specified."
+            },
+            "api-version": {
+              "type": "string",
+              "description": "Azure API version. Applies only to the 'azure-openai' provider; not allowed when the provider is 'openai'.",
+              "default": "2023-05-15"
+            },
+            "dimensions": {
+              "type": "integer",
+              "description": "Number of dimensions in the output embedding vector. Defaults to 1536 if not specified. Useful for matching the vector size expected by a Redis schema.",
+              "default": 1536,
+              "minimum": 1
+            },
+            "timeout-ms": {
+              "type": "integer",
+              "description": "Request timeout in milliseconds.",
+              "default": 30000,
+              "minimum": 1,
+              "maximum": 300000
+            },
+            "endpoint": {
+              "type": "object",
+              "description": "REST endpoint configuration for the embedding service.",
+              "additionalProperties": false,
+              "properties": {
+                "enabled": {
+                  "type": "boolean",
+                  "description": "Whether the embedding REST endpoint (served at the configured 'path', '/embed' by default) is enabled. Defaults to false.",
+                  "default": false
+                },
+                "path": {
+                  "type": "string",
+                  "description": "The URL path for the embedding endpoint. Defaults to '/embed'.",
+                  "default": "/embed"
+                },
+                "roles": {
+                  "type": "array",
+                  "description": "The roles allowed to access the embedding endpoint. Defaults to ['authenticated'].",
+                  "default": ["authenticated"],
+                  "items": {
+                    "type": "string"
+                  }
+                }
+              }
+            },
+            "health": {
+              "type": "object",
+              "description": "Health check configuration for the embedding service.",
+              "additionalProperties": false,
+              "properties": {
+                "enabled": {
+                  "type": "boolean",
+                  "description": "Whether health checks are enabled for embeddings. Defaults to false.",
+                  "default": false
+                },
+                "threshold-ms": {
+                  "type": "integer",
+                  "description": "The maximum response time in milliseconds to be considered healthy.",
+                  "default": 1000,
+                  "minimum": 1,
+                  "maximum": 300000
+                },
+                "test-text": {
+                  "type": "string",
+                  "description": "The text to use for health check validation.",
+                  "default": "health check"
+                },
+                "expected-dimensions": {
+                  "type": "integer",
+                  "description": "The expected number of dimensions in the embedding result. If specified, dimension validation is performed.",
+                  "minimum": 1
+                }
+              }
+            },
+            "cache": {
+              "type": "object",
+              "description": "Cache configuration for embedding results.",
+              "additionalProperties": false,
+              "properties": {
+                "enabled": {
+                  "type": "boolean",
+                  "description": "Whether caching is enabled for embeddings. Defaults to true.",
+                  "default": true
+                },
+                "level": {
+                  "type": "string",
+                  "description": "Cache level (L1 for in-memory only, L1L2 for in-memory + distributed). Defaults to L1.",
+                  "enum": ["L1", "L1L2"],
+                  "default": "L1"
+                },
+                "ttl-seconds": {
+                  "type": "integer",
+                  "description": "Time-to-live for cached embeddings in seconds. Defaults to 86400 (24 hours).",
+                  "default": 86400,
+                  "minimum": 1
+                }
+              }
+            },
+            "chunking": {
+              "type": "object",
+              "description": "Chunking configuration for text processing before embedding. Used to split large text inputs into smaller chunks.",
+              "additionalProperties": false,
+              "properties": {
+                "enabled": {
+                  "type": "boolean",
+                  "description": "Whether chunking is enabled. Defaults to true.",
+                  "default": true
+                },
+                "size-chars": {
+                  "type": "integer",
+                  "description": "The size of each chunk in characters.",
+                  "default": 800,
+                  "minimum": 1
+                },
+                "overlap-chars": {
+                  "type": "integer",
+                  "description": "The number of characters to overlap between consecutive chunks. Overlap helps maintain context across chunk boundaries.",
+                  "default": 100,
+                  "minimum": 0
+                }
+              }
+            }
+          },
+          "required": ["provider", "base-url", "api-key"],
+          "allOf": [
+            {
+              "$comment": "Azure OpenAI requires the model (deployment name) to be specified.",
+              "if": {
+                "properties": {
+                  "provider": {
+                    "const": "azure-openai"
+                  }
+                },
+                "required": ["provider"]
+              },
+              "then": {
+                "required": ["model"],
+                "properties": {
+                  "api-version": {
+                    "type": "string",
+                    "description": "Azure API version. Used only by the Azure OpenAI provider; optional, with a default of 2023-05-15.",
+                    "default": "2023-05-15"
+                  }
+                }
+              }
+            },
+            {
+              "$comment": "OpenAI does not require model (defaults to text-embedding-3-small) and must not specify api-version, which applies only to Azure OpenAI.",
+              "if": {
+                "properties": {
+                  "provider": {
+                    "const": "openai"
+                  }
+                },
+                "required": ["provider"]
+              },
+              "then": {
+                "properties": {
+                  "api-version": false
+                }
+              }
+            }
+          ]
         }
       }
     },