From 989a170a78c19129a4403e1932327b4b09d622bd Mon Sep 17 00:00:00 2001 From: Clawdbot Date: Fri, 30 Jan 2026 03:37:52 +0000 Subject: [PATCH] Switch to bge-base-en-v1.5 (512 token context) --- README.md | 6 +++--- deployment.yaml | 2 +- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/README.md b/README.md index ea3183c..57c9608 100644 --- a/README.md +++ b/README.md @@ -6,7 +6,7 @@ Lightweight embedding service for Clawdbot memory search. Runs [HuggingFace Text Embeddings Inference](https://github.com/huggingface/text-embeddings-inference) (TEI) on CPU to provide OpenAI-compatible embeddings for semantic memory search. -- **Model:** `sentence-transformers/all-MiniLM-L6-v2` (~90MB, 384 dimensions) +- **Model:** `BAAI/bge-base-en-v1.5` (~440MB, 768 dimensions, 512 token context) - **Endpoint:** `http://text-embeddings:8080/v1/embeddings` - **No GPU required** @@ -28,7 +28,7 @@ Add to `~/.clawdbot/clawdbot.json`: "memorySearch": { "enabled": true, "provider": "openai", - "model": "sentence-transformers/all-MiniLM-L6-v2", + "model": "BAAI/bge-base-en-v1.5", "remote": { "baseUrl": "http://text-embeddings.tei.svc.cluster.local:8080/v1/", "apiKey": "not-needed" @@ -50,5 +50,5 @@ Add to `~/.clawdbot/clawdbot.json`: ```bash curl -X POST http://text-embeddings:8080/v1/embeddings \ -H "Content-Type: application/json" \ - -d '{"input": "Hello world", "model": "sentence-transformers/all-MiniLM-L6-v2"}' + -d '{"input": "Hello world", "model": "BAAI/bge-base-en-v1.5"}' ``` diff --git a/deployment.yaml b/deployment.yaml index 940aac2..fdf2bde 100644 --- a/deployment.yaml +++ b/deployment.yaml @@ -33,7 +33,7 @@ spec: image: ghcr.io/huggingface/text-embeddings-inference:cpu-1.6 args: - --model-id - - sentence-transformers/all-MiniLM-L6-v2 + - BAAI/bge-base-en-v1.5 - --port - "8080" ports: