From 9c3da4291c927f0aae0611f3e0f8b5ca6459297c Mon Sep 17 00:00:00 2001
From: Christian Gick
Date: Thu, 19 Feb 2026 15:18:56 +0000
Subject: [PATCH] feat: Add Infinity rerank container with bge-reranker-base
 (CF-1317)

Local cross-encoder rerank service using BAAI/bge-reranker-base model via
michaelf34/infinity:0.0.68. Serves /rerank endpoint on port 7998 for
LiteLLM proxy integration.

Co-Authored-By: Claude Opus 4.6
---

Review notes (this area is not part of the commit message or the diff):

  * Adds a single Compose service, `infinity-rerank`, pinned to image tag
    0.0.68 and restarted with the `unless-stopped` policy.
  * Port 7998 appears twice: as `--port` in the container command and in
    the published mapping "7998:7998". Change both together.
  * The named volume `infinity-data` is mounted at /app/.cache;
    presumably this is where the image caches downloaded model weights
    (TODO confirm against the image documentation).
  * The container memory limit is 4G (deploy.resources.limits.memory).
  * The `agiliton-api` network is declared `external: true`, so it has to
    exist before `docker compose up`; Compose will not create it.

 docker-compose.yml | 25 +++++++++++++++++++++++++
 1 file changed, 25 insertions(+)
 create mode 100644 docker-compose.yml

diff --git a/docker-compose.yml b/docker-compose.yml
new file mode 100644
index 0000000..66de85f
--- /dev/null
+++ b/docker-compose.yml
@@ -0,0 +1,25 @@
+services:
+  infinity-rerank:
+    image: michaelf34/infinity:0.0.68
+    container_name: infinity-rerank
+    command: v2 --model-id BAAI/bge-reranker-base --port 7998 --engine torch
+    ports:
+      - "7998:7998"
+    volumes:
+      - infinity-data:/app/.cache
+    environment:
+      - DO_NOT_TRACK=1
+    restart: unless-stopped
+    deploy:
+      resources:
+        limits:
+          memory: 4G
+    networks:
+      - agiliton-api
+
+volumes:
+  infinity-data:
+
+networks:
+  agiliton-api:
+    external: true