I usually build simple applications that expose public APIs backed by PostgreSQL databases. Sometimes, though, that isn't enough: businesses often need more flexible and intelligent search than PostgreSQL's built-in capabilities provide. One might argue that PostgreSQL already supports full-text search. It does, but full-text search is about finding specific words or phrases. Semantic search focuses on understanding contextual meaning rather than exact keyword matches, and that's what we'll explore.
Database side
The first solution that comes to mind is Elasticsearch. It’s an excellent tool for our problem, but it introduces extra cost, additional infrastructure, and the need to learn and integrate a new technology. Since we already use PostgreSQL, we can simply enable the pgvector extension for vector search.
- Install the NuGet package that adds vector support (e.g. Pgvector.EntityFrameworkCore for EF Core).
- Configure a model to store and search vectors. I'm using the ivfflat index type, which is optimised for approximate nearest neighbor search, and enabling vector_cosine_ops for cosine distance similarity search.
modelBuilder.HasPostgresExtension("vector");

modelBuilder.Entity<TextEmbedding>(entity =>
{
    entity.HasKey(e => e.Id);
    entity.Property(e => e.Content).IsRequired();
    // all-minilm produces 384-dimensional vectors
    entity.Property(e => e.Embedding).HasColumnType("vector(384)");
    entity.Property(e => e.CreatedAt).IsRequired();
    // Add an index for vector similarity search
    entity.HasIndex(e => e.Embedding)
        .HasMethod("ivfflat")
        .HasOperators("vector_cosine_ops");
});
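For reference, the EF Core migration generated from this model produces DDL along these lines (a sketch: the table, column, and index names, and the uuid key type, are assumptions that depend on your naming conventions and entity definition):

```sql
CREATE EXTENSION IF NOT EXISTS vector;

CREATE TABLE text_embeddings (
    id uuid PRIMARY KEY,
    content text NOT NULL,
    embedding vector(384),
    created_at timestamptz NOT NULL
);

-- ivfflat is approximate: it clusters vectors and searches only the
-- nearest clusters, trading a little recall for much faster queries
CREATE INDEX ix_text_embeddings_embedding
    ON text_embeddings USING ivfflat (embedding vector_cosine_ops);
```

Seeing the raw DDL makes it clear that nothing EF-specific is stored: the same table can be queried directly with pgvector's operators.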
Application part
Now that the database is ready to work with vectors, let’s move to the application side. We'll register an embedding service, create an endpoint to store text embeddings, and finally build a semantic search endpoint.
1. Register the embedding service.
Microsoft provides an abstraction layer for working with large language models via the Microsoft.Extensions.AI NuGet package, so we don't have to depend on a specific provider. I will use Ollama, a free, open-source tool that simplifies running LLMs locally, together with the OllamaSharp NuGet package to work with it from .NET.
services.AddSingleton<IEmbeddingGenerator<string, Embedding<float>>>(sp =>
{
    var modelId = builder.Configuration["Ollama:EmbeddingModel"];
    var baseUrl = builder.Configuration["Ollama:BaseUrl"];
    return new OllamaApiClient(baseUrl, modelId);
});
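The two configuration keys read above might look like this in appsettings.json (the values shown are assumptions for a local Ollama instance serving the all-minilm model on its default port):

```json
{
  "Ollama": {
    "BaseUrl": "http://localhost:11434",
    "EmbeddingModel": "all-minilm"
  }
}
```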
2. Create an endpoint to convert text to vectors and store them
app.MapPost("/text", async (
    Text[] request,
    EmbeddingDbContext context,
    IEmbeddingGenerator<string, Embedding<float>> embeddingService) =>
{
    // Convert the request texts to vectors
    var embeddings = await embeddingService.GenerateAsync(
        request.Select(s => s.Content));

    var dbModels = embeddings.Select((embedding, index) => new TextEmbedding
    {
        Content = request[index].Content,
        Embedding = new Vector(embedding.Vector),
        CreatedAt = DateTime.UtcNow
    }).ToList();

    context.AddRange(dbModels);
    await context.SaveChangesAsync();

    return TypedResults.Created();
});
3. The magic happens here - semantic search using cosine similarity
app.MapGet("/text/search", async (
    string query,
    EmbeddingDbContext context,
    IEmbeddingGenerator<string, Embedding<float>> embeddingService) =>
{
    const int limit = 5;

    // Convert the query to a vector
    var embedding = await embeddingService.GenerateAsync(query);
    var queryEmbedding = new Vector(embedding.Vector);

    // Find the most similar texts using cosine distance
    var similarTexts = await context.TextEmbeddings
        .OrderBy(x => x.Embedding.CosineDistance(queryEmbedding))
        .Take(limit)
        .Select(x => new Text(x.Content))
        .ToListAsync();

    return TypedResults.Ok(similarTexts);
});
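The cosine distance that vector_cosine_ops computes is language-independent, so it can be illustrated in a few lines of plain Python (a sketch for intuition only, not part of the .NET stack above):

```python
import math

def cosine_distance(a, b):
    # Cosine distance = 1 - cosine similarity, which is what
    # pgvector's <=> operator (vector_cosine_ops) orders by
    dot = sum(x * y for x, y in zip(a, b))
    norm_a = math.sqrt(sum(x * x for x in a))
    norm_b = math.sqrt(sum(x * x for x in b))
    return 1.0 - dot / (norm_a * norm_b)

# Vectors pointing the same way have distance 0;
# orthogonal (unrelated) vectors have distance 1
print(cosine_distance([1.0, 0.0], [2.0, 0.0]))  # 0.0
print(cosine_distance([1.0, 0.0], [0.0, 1.0]))  # 1.0
```

Only the direction of the vectors matters, not their length, which is why cosine distance is a common default for text embeddings.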
Testing locally
To run everything locally, we can use Ollama for generating embeddings. This approach avoids cloud APIs (like OpenAI or Azure) and keeps everything self-contained.
ollama:
  image: ollama/ollama:latest
  container_name: ollama
  ports:
    - "11434:11434"
  entrypoint:
    - "/bin/bash"
    - "-c"
    - "ollama serve & sleep 5 && ollama pull all-minilm && wait"
  environment:
    - OLLAMA_KEEP_ALIVE="24h"
  volumes:
    - ollama_data:/root/.ollama
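Note that the named volume referenced by the service also has to be declared at the top level of the compose file, otherwise docker-compose will reject the configuration:

```yaml
volumes:
  ollama_data:
```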
The rest of the stack - the API, PostgreSQL, and database migrations - can be managed within the same Docker Compose setup.
Conclusion
By combining EF Core, PostgreSQL, and the pgvector extension, we can bring powerful semantic search capabilities directly into ASP.NET applications — without introducing new infrastructure.
The approach is efficient, cost-effective, and fully compatible with familiar .NET tools. Thanks to the Microsoft.Extensions.AI abstraction, we can easily swap between local (Ollama) and cloud (OpenAI, Azure) embeddings. This setup is ideal for building document search, recommendation engines, similarity detection, and RAG-based applications.
You can find the full implementation details in my EmbeddingPoC repository.
Architecture
flowchart LR
  subgraph Architecture
    API[API .NET]
    DB[(PostgreSQL using pgvector)]
    OLLAMA[Ollama LLM]
    MIGRATIONS[EF Migrations]
  end
  API <--> DB
  API <--> OLLAMA
  MIGRATIONS --> DB
API Endpoints
| Method | Endpoint     | Description                      |
| ------ | ------------ | -------------------------------- |
| GET    | /text        | List first 20 texts              |
| POST   | /text        | Add texts (array of { content }) |
| GET    | /text/search | Vector search (?query=...)       |
Testing the API
You can use the provided .http file to easily test the API endpoints directly from Visual Studio Code or other compatible tools. This file contains example requests for adding, searching, and listing texts.
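The requests in that file look roughly like the following (a sketch based on the endpoint table above; the host and port are assumptions and depend on your launch settings):

```http
POST http://localhost:5000/text
Content-Type: application/json

[
  { "content": "PostgreSQL is an open-source relational database." },
  { "content": "Ollama runs large language models locally." }
]

###

GET http://localhost:5000/text/search?query=open source databases
```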
EmbeddingPoC
A proof-of-concept .NET API for text embedding and semantic search using PostgreSQL with pgvector and Ollama for embedding generation.
Features
- Store and retrieve text embeddings in PostgreSQL using Entity Framework Core and pgvector.
- Generate embeddings via Ollama API.
- REST endpoints for:
- Adding new texts and their embeddings.
- Searching for similar texts using vector similarity.
- Listing stored texts.
Usage
Simply run:
docker-compose up --build
…