server: refactor with diarization, logic works

2026-02-04 09:56:47 +00:00 · 2023-10-27 15:59:27 +02:00
parent 1c42473da0
commit 07c4d080c2
17 changed files with 387 additions and 169 deletions
--- a/server/tests/conftest.py
+++ b/server/tests/conftest.py
@@ -45,17 +45,16 @@ async def dummy_transcript():
    from reflector.processors.types import AudioFile, Transcript, Word

    class TestAudioTranscriptProcessor(AudioTranscriptProcessor):
-        async def _transcript(self, data: AudioFile):
-            source_language = self.get_pref("audio:source_language", "en")
-            print("transcripting", source_language)
-            print("pipeline", self.pipeline)
-            print("prefs", self.pipeline.prefs)
+        _time_idx = 0  # class-level starting offset, read through self in _transcript

+        async def _transcript(self, data: AudioFile):
+            i = self._time_idx  # start time of the first word returned by this call
+            self._time_idx += 2  # step past the two words (i..i+1 and i+1..i+2) built below
            return Transcript(
                text="Hello world.",
                words=[
-                    Word(start=0.0, end=1.0, text="Hello"),
-                    Word(start=1.0, end=2.0, text=" world."),
+                    Word(start=i, end=i + 1, text="Hello", speaker=0),
+                    Word(start=i + 1, end=i + 2, text=" world.", speaker=0),
                ],
            )

@@ -98,7 +97,17 @@ def ensure_casing():
@pytest.fixture
 def sentence_tokenize():
    with patch(
-        "reflector.processors.TranscriptFinalLongSummaryProcessor" ".sentence_tokenize"
+        "reflector.processors.TranscriptFinalLongSummaryProcessor.sentence_tokenize"  # same patch target, now one literal instead of two adjacent ones
    ) as mock_sent_tokenize:
        mock_sent_tokenize.return_value = ["LLM LONG SUMMARY"]
        yield
+
+
+@pytest.fixture(scope="session")
+def celery_enable_logging():  # session-scoped fixture that always returns True
+    return True  # NOTE(review): presumably overrides the same-named fixture from Celery's pytest plugin - confirm
+
+
+@pytest.fixture(scope="session")
+def celery_config():  # session-scoped fixture returning a fixed settings dict
+    return {"broker_url": "memory://", "result_backend": "rpc"}  # NOTE(review): looks like an in-memory broker with the RPC result backend for tests - confirm