feat(03-03): wire get_current_user into /api/topics/*; add load_topics_for_user; POST /api/admin/topics

- api/topics.py: add get_current_user dep to all 5 handlers (list, create, update, delete, suggest)
- list_topics: uses load_topics_for_user (system topics + user's own) with user-scoped doc counts
- create_topic: passes user_id=current_user.id (never creates system topics via regular endpoint)
- update_topic/delete_topic: ownership assertion — system topics and other users' topics return 404
- api/admin.py: add SystemTopicCreate model + POST /api/admin/topics (user_id=NULL, admin-only)
- services/storage.py: add or_ import; load_topics_for_user (D-17); create_topic gains user_id param with namespace-scoped dedup; topic_doc_counts gains optional user_id for user-scoped counts; add load_topics_for_user to __all__
- services/classifier.py: replace load_topics with load_topics_for_user(doc.user_id); pass user_id=doc.user_id to create_topic for AI-suggested topics (D-11)
- Tests: update all topic tests to pass auth headers; implement test_topic_namespace, test_admin_create_system_topic, test_regular_user_cannot_create_system_topic, test_topics_require_auth
2026-05-23 20:15:44 +02:00
parent b28bb01995
commit 5950a3f5c2
5 changed files with 292 additions and 55 deletions
@@ -5,11 +5,18 @@ Loads settings, selects AI provider, classifies document, auto-creates suggested
 Updated in Plan 05: classify_document and suggest_topics_for_document now accept
 an AsyncSession as their first argument so they can be called from the Celery task
 wrapper and from API route handlers that already hold a session.
+
+Updated in Plan 03-03: classify_document uses load_topics_for_user (D-17) to scope
+topic lookup to the document owner's namespace, and creates AI-suggested topics in
+the user's namespace via create_topic(user_id=doc.user_id) (D-11).
 """
 from __future__ import annotations

+import uuid as _uuid
+
 from sqlalchemy.ext.asyncio import AsyncSession

+from db.models import Document
 from services import storage
 from ai import get_provider

@@ -24,7 +31,7 @@ async def classify_document(
    """
    Classify a document by its ID. Returns the list of assigned topic names.
    If topic_names is provided, restrict classification to those topics.
-    Auto-creates any newly suggested topics.
+    Auto-creates any newly suggested topics in the document owner's namespace (D-11).
    """
    meta = await storage.get_metadata(session, doc_id)
    if meta is None:
@@ -34,9 +41,22 @@ async def classify_document(
    system_prompt = settings.get("system_prompt", "")
    provider = get_provider(settings)

-    # Use all known topics if not specified
+    # Load the Document ORM object to get the owner's user_id (D-11, D-17)
+    try:
+        uid = _uuid.UUID(doc_id)
+    except ValueError:
+        uid = None
+
+    doc = await session.get(Document, uid) if uid is not None else None
+    doc_user_id = doc.user_id if doc is not None else None
+
+    # Use namespace-scoped topic list if not specified (D-17)
    if topic_names is None:
-        all_topics = await storage.load_topics(session)
+        if doc_user_id is not None:
+            all_topics = await storage.load_topics_for_user(session, user_id=doc_user_id)
+        else:
+            # Fallback for documents without a user (legacy / test data)
+            all_topics = await storage.load_topics(session)
        topic_names = [t["name"] for t in all_topics]

    text = meta.get("extracted_text", "")
@@ -45,11 +65,11 @@ async def classify_document(
    # Collect all topic names to persist (assigned + suggested)
    all_new_names = set(result.suggested_new_topics) | set(result.topics)

-    # Auto-create any topic not already in the registry
+    # Auto-create any topic not already in the registry — in the user's namespace (D-11)
    existing_names = {t.lower() for t in topic_names}
    for name in all_new_names:
        if name.strip() and name.lower() not in existing_names:
-            await storage.create_topic(session, name.strip())
+            await storage.create_topic(session, name.strip(), user_id=doc_user_id)

    # Final list: everything the AI assigned or suggested
    final_topics = [t for t in list(set(result.topics + result.suggested_new_topics)) if t.strip()]
@@ -28,7 +28,7 @@ import uuid
 from datetime import datetime, timezone
 from typing import Optional

-from sqlalchemy import select, delete, text
+from sqlalchemy import select, delete, text, or_
 from sqlalchemy import func as sql_func
 from sqlalchemy.ext.asyncio import AsyncSession

@@ -258,6 +258,24 @@ async def load_topics(session: AsyncSession) -> list:
    ]


+async def load_topics_for_user(session: AsyncSession, user_id: uuid.UUID) -> list:
+    """Return system topics (user_id IS NULL) + the user's own topics, ordered by name.
+
+    D-08 + D-17 + DOC-04: layered topic namespace. System topics are visible to all
+    users; per-user topics are visible only to their owner. A user's topic list is
+    the union of both sets.
+    """
+    q = await session.execute(
+        select(Topic).where(
+            or_(Topic.user_id == user_id, Topic.user_id.is_(None))
+        ).order_by(Topic.name)
+    )
+    return [
+        {"id": str(t.id), "name": t.name, "description": t.description, "color": t.color}
+        for t in q.scalars()
+    ]
+
+
 async def save_topics(session: AsyncSession, topics: list) -> None:
    """Idempotent bulk replace — delete all Topic rows then insert the list.

@@ -293,11 +311,35 @@ async def create_topic(
    name: str,
    description: str = "",
    color: str = "#6366f1",
+    user_id: Optional[uuid.UUID] = None,
 ) -> dict:
-    """Create a topic, or return the existing one (case-insensitive deduplication)."""
-    q = await session.execute(
-        select(Topic).where(sql_func.lower(Topic.name) == name.lower())
-    )
+    """Create a topic, or return the existing one (case-insensitive, namespace-scoped dedup).
+
+    D-08: user_id=None creates a system topic (visible to all users).
+    D-08: user_id=<uuid> creates a per-user topic (visible only to that user).
+
+    Deduplication is scoped by user_id namespace:
+      - System topics (user_id=None) dedup against other system topics only
+      - Per-user topics dedup within that user's namespace only
+    This allows "Finance" to exist as both a system topic and a per-user topic.
+
+    SQLite note: Uses a branching approach instead of IS NOT DISTINCT FROM
+    (SQLite doesn't support that PostgreSQL construct for NULL comparison).
+    """
+    if user_id is None:
+        q = await session.execute(
+            select(Topic).where(
+                sql_func.lower(Topic.name) == name.lower(),
+                Topic.user_id.is_(None),
+            )
+        )
+    else:
+        q = await session.execute(
+            select(Topic).where(
+                sql_func.lower(Topic.name) == name.lower(),
+                Topic.user_id == user_id,
+            )
+        )
    existing = q.scalars().first()
    if existing is not None:
        return {
@@ -307,7 +349,7 @@ async def create_topic(
            "color": existing.color,
        }

-    topic = Topic(name=name, description=description, color=color)
+    topic = Topic(name=name, description=description, color=color, user_id=user_id)
    session.add(topic)
    await session.commit()
    return {
@@ -361,13 +403,27 @@ async def delete_topic(session: AsyncSession, topic_id: str) -> Optional[str]:
    return name


-async def topic_doc_counts(session: AsyncSession) -> dict:
-    """Return a mapping of topic name -> document count."""
-    q = await session.execute(
+async def topic_doc_counts(
+    session: AsyncSession, user_id: Optional[uuid.UUID] = None
+) -> dict:
+    """Return a mapping of topic name -> document count.
+
+    If user_id is provided, counts only documents belonging to that user.
+    This ensures a user sees the count of their own documents for each topic,
+    not the global count across all users.
+    """
+    stmt = (
        select(Topic.name, sql_func.count(DocumentTopic.document_id))
        .join(DocumentTopic, DocumentTopic.topic_id == Topic.id, isouter=True)
-        .group_by(Topic.name)
    )
+    if user_id is not None:
+        stmt = stmt.join(
+            Document, Document.id == DocumentTopic.document_id, isouter=True
+        ).where(
+            or_(Document.user_id == user_id, Document.user_id.is_(None))
+        )
+    stmt = stmt.group_by(Topic.name)
+    q = await session.execute(stmt)
    return {name: count for name, count in q}


@@ -422,6 +478,7 @@ __all__ = [
    "update_document_topics",
    "remove_topic_from_all_documents",
    "load_topics",
+    "load_topics_for_user",
    "save_topics",
    "get_topic",
    "create_topic",