> For the complete documentation index, see [llms.txt](https://docs.umbraco.com/llms.txt). Markdown versions of documentation pages are available by appending `.md` to page URLs; this page is available as [Markdown](https://docs.umbraco.com/ai-in-umbraco/17.latest/extending/providers/embedding-capability.md). # Embedding Capability The embedding capability enables vector embedding generation. Implement it by extending `AIEmbeddingCapabilityBase<TSettings>`. ## Base Class {% code title="AIEmbeddingCapabilityBase" %} ```csharp public abstract class AIEmbeddingCapabilityBase<TSettings>(IAIProvider provider) : AICapabilityBase<TSettings>(provider), IAICapability, IAIEmbeddingCapability where TSettings : class { // Override this (or CreateGeneratorAsync) to create an IEmbeddingGenerator protected virtual IEmbeddingGenerator<string, Embedding<float>> CreateGenerator( TSettings settings, string? modelId) { /* ... */ } // Override this for an async variant protected virtual Task<IEmbeddingGenerator<string, Embedding<float>>> CreateGeneratorAsync( TSettings settings, string? modelId, CancellationToken cancellationToken = default) { /* ... */ } // Implement this: Return available models protected abstract Task<IReadOnlyList<AIModelDescriptor>> GetModelsAsync( TSettings settings, CancellationToken cancellationToken = default); } ``` {% endcode %} ## Basic Implementation {% code title="MyEmbeddingCapability.cs" %} ```csharp using Microsoft.Extensions.AI; using Umbraco.AI.Core.Models; using Umbraco.AI.Core.Providers; public class MyEmbeddingCapability : AIEmbeddingCapabilityBase<MyProviderSettings> { public MyEmbeddingCapability(IAIProvider provider) : base(provider) { } protected override IEmbeddingGenerator<string, Embedding<float>> CreateGenerator( MyProviderSettings settings, string? modelId) { return new MyEmbeddingGenerator(settings, modelId ?? 
"embedding-model"); } protected override Task<IReadOnlyList<AIModelDescriptor>> GetModelsAsync( MyProviderSettings settings, CancellationToken cancellationToken = default) { var models = new List<AIModelDescriptor> { new(new AIModelRef(Provider.Id, "embedding-small"), "Embedding Small (1536 dims)"), new(new AIModelRef(Provider.Id, "embedding-large"), "Embedding Large (3072 dims)") }; return Task.FromResult<IReadOnlyList<AIModelDescriptor>>(models); } } ``` {% endcode %} ## Register in Provider Add the embedding capability in your provider constructor: {% code title="MyProvider.cs" %} ```csharp [AIProvider("myprovider", "My AI Provider")] public class MyProvider : AIProviderBase<MyProviderSettings> { public MyProvider(IAIProviderInfrastructure infrastructure) : base(infrastructure) { WithCapability<MyChatCapability>(); WithCapability<MyEmbeddingCapability>(); // Add embedding support } } ``` {% endcode %} ## Implementing IEmbeddingGenerator The `IEmbeddingGenerator<TInput, TEmbedding>` interface: {% code title="IEmbeddingGenerator Interface" %} ```csharp public interface IEmbeddingGenerator<TInput, TEmbedding> : IDisposable { EmbeddingGeneratorMetadata Metadata { get; } Task<GeneratedEmbeddings<TEmbedding>> GenerateAsync( IEnumerable<TInput> values, EmbeddingGenerationOptions? options = null, CancellationToken cancellationToken = default); object? GetService(Type serviceType, object? serviceKey = null); } ``` {% endcode %} ## Complete IEmbeddingGenerator Example {% code title="MyEmbeddingGenerator.cs" %} ```csharp using System.Text.Json; using Microsoft.Extensions.AI; public class MyEmbeddingGenerator : IEmbeddingGenerator<string, Embedding<float>> { private readonly HttpClient _httpClient; private readonly string _modelId; public MyEmbeddingGenerator(MyProviderSettings settings, string modelId) { _modelId = modelId; _httpClient = new HttpClient { BaseAddress = new Uri(settings.BaseUrl ?? 
"https://api.myprovider.com") }; _httpClient.DefaultRequestHeaders.Add("Authorization", $"Bearer {settings.ApiKey}"); } public EmbeddingGeneratorMetadata Metadata => new( providerName: "MyProvider", providerUri: new Uri("https://myprovider.com"), modelId: _modelId); public async Task<GeneratedEmbeddings<Embedding<float>>> GenerateAsync( IEnumerable<string> values, EmbeddingGenerationOptions? options = null, CancellationToken cancellationToken = default) { var inputList = values.ToList(); var request = new { model = _modelId, input = inputList }; var response = await _httpClient.PostAsJsonAsync( "/v1/embeddings", request, cancellationToken); response.EnsureSuccessStatusCode(); var result = await response.Content.ReadFromJsonAsync<EmbeddingResponse>( cancellationToken: cancellationToken); var embeddings = result!.Data .OrderBy(d => d.Index) .Select(d => new Embedding<float>(d.Embedding) { ModelId = result.Model, CreatedAt = DateTimeOffset.UtcNow }) .ToList(); return new GeneratedEmbeddings<Embedding<float>>(embeddings) { Usage = new UsageDetails { InputTokenCount = result.Usage?.PromptTokens, TotalTokenCount = result.Usage?.TotalTokens } }; } public object? GetService(Type serviceType, object? serviceKey = null) => null; public void Dispose() => _httpClient.Dispose(); } // API response models internal class EmbeddingResponse { public string Model { get; set; } = ""; public List<EmbeddingData> Data { get; set; } = new(); public EmbeddingUsage? 
Usage { get; set; } } internal class EmbeddingData { public int Index { get; set; } public float[] Embedding { get; set; } = Array.Empty<float>(); } internal class EmbeddingUsage { public int PromptTokens { get; set; } public int TotalTokens { get; set; } } ``` {% endcode %} ## Using Existing M.E.AI Generators If your service has an existing Microsoft.Extensions.AI (M.E.AI) embedding generator: {% code title="Using Existing Generator" %} ```csharp using Microsoft.Extensions.AI; using OpenAI; public class MyOpenAICompatibleEmbeddingCapability : AIEmbeddingCapabilityBase<MyProviderSettings> { public MyOpenAICompatibleEmbeddingCapability(IAIProvider provider) : base(provider) { } protected override IEmbeddingGenerator<string, Embedding<float>> CreateGenerator( MyProviderSettings settings, string? modelId) { var client = new OpenAIClient(new ApiKeyCredential(settings.ApiKey), new OpenAIClientOptions { Endpoint = new Uri(settings.BaseUrl!) }); return client.AsEmbeddingGenerator(modelId ?? "text-embedding-3-small"); } protected override Task<IReadOnlyList<AIModelDescriptor>> GetModelsAsync( MyProviderSettings settings, CancellationToken cancellationToken = default) { return Task.FromResult<IReadOnlyList<AIModelDescriptor>>(new List<AIModelDescriptor> { new(new AIModelRef(Provider.Id, "text-embedding-3-small"), "Text Embedding 3 Small"), new(new AIModelRef(Provider.Id, "text-embedding-3-large"), "Text Embedding 3 Large") }); } } ``` {% endcode %} ## Handling Batches The `GenerateAsync` method receives multiple inputs. Handle batching appropriately: {% code title="Batch Handling" %} ```csharp public async Task<GeneratedEmbeddings<Embedding<float>>> GenerateAsync( IEnumerable<string> values, EmbeddingGenerationOptions? 
options = null, CancellationToken cancellationToken = default) { var inputList = values.ToList(); // Some APIs have batch limits const int maxBatchSize = 100; if (inputList.Count > maxBatchSize) { // Process in chunks var allEmbeddings = new List<Embedding<float>>(); for (int i = 0; i < inputList.Count; i += maxBatchSize) { var batch = inputList.Skip(i).Take(maxBatchSize); var batchResult = await GenerateBatchAsync(batch, cancellationToken); allEmbeddings.AddRange(batchResult); } return new GeneratedEmbeddings<Embedding<float>>(allEmbeddings); } return await GenerateBatchAsync(inputList, cancellationToken); } ``` {% endcode %} ## Dimension Information If your API returns dimension information, include it in the model descriptors: {% code title="With Dimensions" %} ```csharp protected override Task<IReadOnlyList<AIModelDescriptor>> GetModelsAsync( MyProviderSettings settings, CancellationToken cancellationToken = default) { var models = new List<AIModelDescriptor> { new(new AIModelRef(Provider.Id, "embedding-small"), "Small (1536 dimensions)"), new(new AIModelRef(Provider.Id, "embedding-large"), "Large (3072 dimensions)") }; return Task.FromResult<IReadOnlyList<AIModelDescriptor>>(models); } ``` {% endcode %} --- # Agent Instructions This documentation is published with GitBook. GitBook is the documentation platform designed so that both humans and AI agents can read, navigate, and reason over technical content effectively. Learn more at gitbook.com. ## Querying This Documentation If you need additional information that is not directly available in this page, you can query the documentation dynamically by asking a question. Perform an HTTP GET request on the current page URL with the `ask` query parameter, and the optional `goal` query parameter: ``` GET https://docs.umbraco.com/ai-in-umbraco/17.latest/extending/providers/embedding-capability.md?ask=<question>&goal=<goal> ``` `ask` is the immediate question: it should be specific, self-contained, and written in natural language. `goal` is optional and describes the broader end goal you are ultimately trying to accomplish on behalf of the user. 
GitBook uses it to tailor the answer towards what is most useful for that goal. The response will contain a direct answer to the question and relevant excerpts and sources from the documentation. Use this mechanism when the answer is not explicitly present in the current page, you need clarification or additional context, or you want to retrieve related documentation sections.