server: add API to reassign speakers, and get topics with words

2026-04-20 12:16:55 +00:00 · 2023-12-06 16:41:18 +01:00
parent 84a1350df7
commit 6f3d7df507
6 changed files with 306 additions and 8 deletions
--- a/server/reflector/app.py
+++ b/server/reflector/app.py
@@ -17,6 +17,7 @@ from reflector.views.transcripts_audio import router as transcripts_audio_router
 from reflector.views.transcripts_participants import (
    router as transcripts_participants_router,
 )
+from reflector.views.transcripts_speaker import router as transcripts_speaker_router
 from reflector.views.transcripts_webrtc import router as transcripts_webrtc_router
 from reflector.views.transcripts_websocket import router as transcripts_websocket_router
 from reflector.views.user import router as user_router
@@ -68,6 +69,7 @@ app.include_router(rtc_offer_router)
 app.include_router(transcripts_router, prefix="/v1")
 app.include_router(transcripts_audio_router, prefix="/v1")
 app.include_router(transcripts_participants_router, prefix="/v1")
+app.include_router(transcripts_speaker_router, prefix="/v1")
 app.include_router(transcripts_websocket_router, prefix="/v1")
 app.include_router(transcripts_webrtc_router, prefix="/v1")
 app.include_router(user_router, prefix="/v1")
--- a/server/reflector/db/transcripts.py
+++ b/server/reflector/db/transcripts.py
@@ -362,7 +362,7 @@ class TranscriptController:
        await database.execute(query)
        return transcript

-    async def update(self, transcript: Transcript, values: dict):
+    async def update(self, transcript: Transcript, values: dict, mutate=True):
        """
        Update a transcript fields with key/values in values
        """
@@ -372,8 +372,9 @@ class TranscriptController:
            .values(**values)
        )
        await database.execute(query)
-        for key, value in values.items():
-            setattr(transcript, key, value)
+        if mutate:
+            for key, value in values.items():
+                setattr(transcript, key, value)

    async def remove_by_id(
        self,
@@ -410,7 +411,11 @@ class TranscriptController:
        Append an event to a transcript
        """
        resp = transcript.add_event(event=event, data=data)
-        await self.update(transcript, {"events": transcript.events_dump()})
+        await self.update(
+            transcript,
+            {"events": transcript.events_dump()},
+            mutate=False,
+        )
        return resp

    async def upsert_topic(
@@ -422,7 +427,11 @@ class TranscriptController:
        Append an event to a transcript
        """
        transcript.upsert_topic(topic)
-        await self.update(transcript, {"topics": transcript.topics_dump()})
+        await self.update(
+            transcript,
+            {"topics": transcript.topics_dump()},
+            mutate=False,
+        )

    async def move_mp3_to_storage(self, transcript: Transcript):
        """
@@ -450,7 +459,11 @@ class TranscriptController:
        Add/update a participant to a transcript
        """
        result = transcript.upsert_participant(participant)
-        await self.update(transcript, {"participants": transcript.participants_dump()})
+        await self.update(
+            transcript,
+            {"participants": transcript.participants_dump()},
+            mutate=False,
+        )
        return result

    async def delete_participant(
@@ -462,7 +475,11 @@ class TranscriptController:
        Delete a participant from a transcript
        """
        transcript.delete_participant(participant_id)
-        await self.update(transcript, {"participants": transcript.participants_dump()})
+        await self.update(
+            transcript,
+            {"participants": transcript.participants_dump()},
+            mutate=False,
+        )


 transcripts_controller = TranscriptController()
--- a/server/reflector/views/transcripts.py
+++ b/server/reflector/views/transcripts.py
@@ -13,6 +13,7 @@ from reflector.db.transcripts import (
    transcripts_controller,
 )
 from reflector.processors.types import Transcript as ProcessorTranscript
+from reflector.processors.types import Word
 from reflector.settings import settings

 router = APIRouter()
@@ -159,6 +160,17 @@ class GetTranscriptTopic(BaseModel):
        )


+class GetTranscriptTopicWithWords(GetTranscriptTopic):
+    words: list[Word] = []
+
+    @classmethod
+    def from_transcript_topic(cls, topic: TranscriptTopic):
+        instance = super().from_transcript_topic(topic)
+        if topic.words:
+            instance.words = topic.words
+        return instance
+
+
@router.get("/transcripts/{transcript_id}", response_model=GetTranscript)
 async def transcript_get(
    transcript_id: str,
@@ -215,3 +227,23 @@ async def transcript_get_topics(
    return [
        GetTranscriptTopic.from_transcript_topic(topic) for topic in transcript.topics
    ]
+
+
+@router.get(
+    "/transcripts/{transcript_id}/topics/with-words",
+    response_model=list[GetTranscriptTopicWithWords],
+)
+async def transcript_get_topics_with_words(
+    transcript_id: str,
+    user: Annotated[Optional[auth.UserInfo], Depends(auth.current_user_optional)],
+):
+    user_id = user["sub"] if user else None
+    transcript = await transcripts_controller.get_by_id_for_http(
+        transcript_id, user_id=user_id
+    )
+
+    # convert to GetTranscriptTopicWithWords
+    return [
+        GetTranscriptTopicWithWords.from_transcript_topic(topic)
+        for topic in transcript.topics
+    ]
--- a/server/reflector/views/transcripts_speaker.py
+++ b/server/reflector/views/transcripts_speaker.py
@@ -0,0 +1,63 @@
+"""
+Reassign speakers in a transcript
+=================================
+
+"""
+from typing import Annotated, Optional
+
+import reflector.auth as auth
+from fastapi import APIRouter, Depends, HTTPException
+from pydantic import BaseModel
+from reflector.db.transcripts import transcripts_controller
+
+router = APIRouter()
+
+
+class SpeakerAssignment(BaseModel):
+    speaker: int
+    timestamp_from: float
+    timestamp_to: float
+
+
+class SpeakerAssignmentStatus(BaseModel):
+    status: str
+
+
+@router.patch("/transcripts/{transcript_id}/speaker/assign")
+async def transcript_assign_speaker(
+    transcript_id: str,
+    assignment: SpeakerAssignment,
+    user: Annotated[Optional[auth.UserInfo], Depends(auth.current_user_optional)],
+) -> SpeakerAssignmentStatus:
+    user_id = user["sub"] if user else None
+    transcript = await transcripts_controller.get_by_id_for_http(
+        transcript_id, user_id=user_id
+    )
+
+    if not transcript:
+        raise HTTPException(status_code=404, detail="Transcript not found")
+
+    # reassign speakers from words in the transcript
+    ts_from = assignment.timestamp_from
+    ts_to = assignment.timestamp_to
+    changed_topics = []
+    for topic in transcript.topics:
+        changed = False
+        for word in topic.words:
+            if ts_from <= word.start <= ts_to:
+                word.speaker = assignment.speaker
+                changed = True
+        if changed:
+            changed_topics.append(topic)
+
+    # batch changes
+    for topic in changed_topics:
+        transcript.upsert_topic(topic)
+    await transcripts_controller.update(
+        transcript,
+        {
+            "topics": transcript.topics_dump(),
+        },
+    )
+
+    return SpeakerAssignmentStatus(status="ok")