feat: implement service-specific Modal API keys with auto processor pattern (#528)

* fix: refactor modal API key configuration for better separation of concerns - Split generic MODAL_API_KEY into service-specific keys: - TRANSCRIPT_API_KEY for transcription service - DIARIZATION_API_KEY for diarization service - TRANSLATE_API_KEY for translation service - Remove deprecated *_MODAL_API_KEY settings - Add proper validation to ensure URLs are set when using modal processors - Update README with new configuration format BREAKING CHANGE: Configuration keys have changed. Update your .env file: - TRANSCRIPT_MODAL_API_KEY → TRANSCRIPT_API_KEY - LLM_MODAL_API_KEY → (removed, use TRANSCRIPT_API_KEY) - Add DIARIZATION_API_KEY and TRANSLATE_API_KEY if using those services * fix: update Modal backend configuration to use service-specific API keys - Changed from generic MODAL_API_KEY to service-specific keys: - TRANSCRIPT_MODAL_API_KEY for transcription - DIARIZATION_MODAL_API_KEY for diarization - TRANSLATION_MODAL_API_KEY for translation - Updated audio_transcript_modal.py and audio_diarization_modal.py to use modal_api_key parameter - Updated documentation in README.md, CLAUDE.md, and env.example * feat: implement auto/modal pattern for translation processor - Created TranscriptTranslatorAutoProcessor following the same pattern as transcript/diarization - Created TranscriptTranslatorModalProcessor with TRANSLATION_MODAL_API_KEY support - Added TRANSLATION_BACKEND setting (defaults to "modal") - Updated all imports to use TranscriptTranslatorAutoProcessor instead of TranscriptTranslatorProcessor - Updated env.example with TRANSLATION_BACKEND and TRANSLATION_MODAL_API_KEY - Updated test to expect TranscriptTranslatorModalProcessor name - All tests passing * refactor: simplify transcript_translator base class to match other processors - Moved all implementation from base class to modal processor - Base class now only defines abstract _translate method - Follows the same minimal pattern as audio_diarization and audio_transcript base classes - Updated test mock 
to use _translate instead of get_translation - All tests passing * chore: clean up settings and improve type annotations - Remove deprecated generic API key variables from settings - Add comments to group Modal-specific settings - Improve type annotations for modal_api_key parameters * fix: typing * fix: passing key to openai * test: fix rtc test failing due to a change in transcript. It also correctly sets up the database from sqlite, in case our configuration is set up for postgres. * ci: deactivate translation backend by default * test: fix modal->mock * refactor: implementing igor review, mock to passthrough
2026-02-04 09:56:47 +00:00 · 2025-08-04 12:07:30 -06:00
parent 5bd8233657
commit dc177af3ff
20 changed files with 220 additions and 85 deletions
--- a/server/tests/conftest.py
+++ b/server/tests/conftest.py
@@ -7,15 +7,11 @@ import pytest
@pytest.fixture(scope="function", autouse=True)
@pytest.mark.asyncio
 async def setup_database():
-    from reflector.settings import settings
+    from reflector.db import engine, metadata  # noqa

-    with NamedTemporaryFile() as f:
-        settings.DATABASE_URL = f"sqlite:///{f.name}"
-        from reflector.db import engine, metadata
-
-        metadata.create_all(bind=engine)
-
-        yield
+    metadata.drop_all(bind=engine)
+    metadata.create_all(bind=engine)
+    yield


@pytest.fixture
@@ -33,9 +29,6 @@ def dummy_processors():
        patch(
            "reflector.processors.transcript_final_summary.TranscriptFinalSummaryProcessor.get_short_summary"
        ) as mock_short_summary,
-        patch(
-            "reflector.processors.transcript_translator.TranscriptTranslatorProcessor.get_translation"
-        ) as mock_translate,
    ):
        from reflector.processors.transcript_topic_detector import TopicResponse

@@ -45,9 +38,7 @@ def dummy_processors():
        mock_title.return_value = "LLM Title"
        mock_long_summary.return_value = "LLM LONG SUMMARY"
        mock_short_summary.return_value = "LLM SHORT SUMMARY"
-        mock_translate.return_value = "Bonjour le monde"
        yield (
-            mock_translate,
            mock_topic,
            mock_title,
            mock_long_summary,
@@ -105,6 +96,27 @@ async def dummy_diarization():
        yield


+@pytest.fixture
+async def dummy_transcript_translator():
+    from reflector.processors.transcript_translator import TranscriptTranslatorProcessor
+
+    class TestTranscriptTranslatorProcessor(TranscriptTranslatorProcessor):
+        async def _translate(self, text: str) -> str:
+            source_language = self.get_pref("audio:source_language", "en")
+            target_language = self.get_pref("audio:target_language", "en")
+            return f"{source_language}:{target_language}:{text}"
+
+    def mock_new(cls, *args, **kwargs):
+        return TestTranscriptTranslatorProcessor(*args, **kwargs)
+
+    with patch(
+        "reflector.processors.transcript_translator_auto"
+        ".TranscriptTranslatorAutoProcessor.__new__",
+        mock_new,
+    ):
+        yield
+
+
@pytest.fixture
 async def dummy_llm():
    from reflector.llm import LLM
--- a/server/tests/test_processors_pipeline.py
+++ b/server/tests/test_processors_pipeline.py
@@ -33,7 +33,7 @@ async def test_basic_process(

    # validate the events
    assert marks["TranscriptLinerProcessor"] == 1
-    assert marks["TranscriptTranslatorProcessor"] == 1
+    assert marks["TranscriptTranslatorPassthroughProcessor"] == 1
    assert marks["TranscriptTopicDetectorProcessor"] == 1
    assert marks["TranscriptFinalSummaryProcessor"] == 1
    assert marks["TranscriptFinalTitleProcessor"] == 1
--- a/server/tests/test_transcripts_rtc_ws.py
+++ b/server/tests/test_transcripts_rtc_ws.py
@@ -67,6 +67,7 @@ async def test_transcript_rtc_and_websocket(
    dummy_transcript,
    dummy_processors,
    dummy_diarization,
+    dummy_transcript_translator,
    dummy_storage,
    fake_mp3_upload,
    appserver,
@@ -164,7 +165,7 @@ async def test_transcript_rtc_and_websocket(
    assert "TRANSCRIPT" in eventnames
    ev = events[eventnames.index("TRANSCRIPT")]
    assert ev["data"]["text"].startswith("Hello world.")
-    assert ev["data"]["translation"] == "Bonjour le monde"
+    assert ev["data"]["translation"] is None

    assert "TOPIC" in eventnames
    ev = events[eventnames.index("TOPIC")]
@@ -224,6 +225,7 @@ async def test_transcript_rtc_and_websocket_and_fr(
    dummy_transcript,
    dummy_processors,
    dummy_diarization,
+    dummy_transcript_translator,
    dummy_storage,
    fake_mp3_upload,
    appserver,
@@ -330,7 +332,7 @@ async def test_transcript_rtc_and_websocket_and_fr(
    assert "TRANSCRIPT" in eventnames
    ev = events[eventnames.index("TRANSCRIPT")]
    assert ev["data"]["text"].startswith("Hello world.")
-    assert ev["data"]["translation"] == "Bonjour le monde"
+    assert ev["data"]["translation"] == "en:fr:Hello world."

    assert "TOPIC" in eventnames
    ev = events[eventnames.index("TOPIC")]