Files
steve b5a203d2aa Add bulk operations and remove collections abstraction
- Add bulk delete, bulk tags, and bulk set-tags engine endpoints
  (POST /api/v1/bulk/delete, /bulk/tags, /bulk/set-tags)
- Filter-based selection: by tags, doc_type, ID list, ID range
- Safety threshold (KB_BULK_SAFETY_PERCENT, default 70%) prevents
  accidental mass operations unless force=true
- Synchronous execution with audit trail via jobs table
- Add kb_bulk_delete, kb_bulk_tags, kb_bulk_set_tags MCP tools
- Add kb bulk-remove, bulk-tag, bulk-set-tags CLI commands
- Remove collection abstraction from MCP server (use tags instead)
- Remove kb_set_collection MCP tool
- Update SKILL.md, MCP.md, README.md documentation

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
2026-04-04 22:34:47 +01:00

70 lines
1.8 KiB
Python

"""Engine entry point — FastAPI server with eager model loading."""
import asyncio
import logging
import os
from contextlib import asynccontextmanager
from pathlib import Path
from fastapi import FastAPI
_version_file = Path(__file__).parent / "VERSION"
__version__ = _version_file.read_text().strip() if _version_file.exists() else "dev"
from kb.config import cfg
from kb.embeddings import load_model
from kb.database import get_connection, init_schema
from kb.worker import ingestion_worker
logging.basicConfig(level=logging.INFO, format="%(asctime)s %(levelname)s %(message)s")
log = logging.getLogger("kb.engine")
# Track readiness for health endpoint
ready = False
worker_task: asyncio.Task | None = None
@asynccontextmanager
async def lifespan(app: FastAPI):
global ready, worker_task
# Set HF cache before any model imports
os.environ["HF_HOME"] = str(cfg.hf_cache)
log.info("Starting engine...")
cfg.ensure_dirs()
# Initialise database
conn = get_connection(cfg.db_path)
model_dim = load_model(cfg.model, cfg.device)
init_schema(conn, model_dim)
conn.close()
# Start background ingestion worker
worker_task = asyncio.create_task(ingestion_worker())
ready = True
log.info("Engine ready — model: %s, device: %s", cfg.model, cfg.device)
yield
# Shutdown
ready = False
if worker_task:
worker_task.cancel()
try:
await worker_task
except asyncio.CancelledError:
pass
log.info("Engine stopped.")
app = FastAPI(title="kb-engine", version=__version__, lifespan=lifespan)
# Import routes after app is created
from kb.routes import health, search, jobs, documents, tags, status, reindex, auth, notes, bulk # noqa: E402, F401
if __name__ == "__main__":
import uvicorn
uvicorn.run("main:app", host=cfg.host, port=cfg.port, log_level="info")