From 06b0abaf624c48af7be1e3e230799236cb5e6d23 Mon Sep 17 00:00:00 2001 From: projects-g <63178974+projects-g@users.noreply.github.com> Date: Thu, 20 Jun 2024 12:07:28 +0530 Subject: [PATCH] deployment fix (#364) --- server/gpu/{modal => modal_deployments}/README.md | 0 .../gpu/{modal => modal_deployments}/reflector_diarizer.py | 6 +++--- server/gpu/{modal => modal_deployments}/reflector_llm.py | 0 .../{modal => modal_deployments}/reflector_llm_zephyr.py | 0 .../{modal => modal_deployments}/reflector_transcriber.py | 0 .../{modal => modal_deployments}/reflector_translator.py | 0 6 files changed, 3 insertions(+), 3 deletions(-) rename server/gpu/{modal => modal_deployments}/README.md (100%) rename server/gpu/{modal => modal_deployments}/reflector_diarizer.py (96%) rename server/gpu/{modal => modal_deployments}/reflector_llm.py (100%) rename server/gpu/{modal => modal_deployments}/reflector_llm_zephyr.py (100%) rename server/gpu/{modal => modal_deployments}/reflector_transcriber.py (100%) rename server/gpu/{modal => modal_deployments}/reflector_translator.py (100%) diff --git a/server/gpu/modal/README.md b/server/gpu/modal_deployments/README.md similarity index 100% rename from server/gpu/modal/README.md rename to server/gpu/modal_deployments/README.md diff --git a/server/gpu/modal/reflector_diarizer.py b/server/gpu/modal_deployments/reflector_diarizer.py similarity index 96% rename from server/gpu/modal/reflector_diarizer.py rename to server/gpu/modal_deployments/reflector_diarizer.py index 1a0e9f0a..ddab9950 100644 --- a/server/gpu/modal/reflector_diarizer.py +++ b/server/gpu/modal_deployments/reflector_diarizer.py @@ -11,7 +11,6 @@ from pydantic import BaseModel PYANNOTE_MODEL_NAME: str = "pyannote/speaker-diarization-3.0" MODEL_DIR = "/root/diarization_models" -HUGGINGFACE_TOKEN = modal.Secret.from_name("my-huggingface-secret") stub = Stub(name="reflector-diarizer") @@ -34,7 +33,7 @@ def download_pyannote_audio(): Pipeline.from_pretrained( "pyannote/speaker-diarization-3.0", cache_dir=MODEL_DIR, - use_auth_token=HUGGINGFACE_TOKEN + use_auth_token=os.environ["HF_TOKEN"] ) @@ -55,7 +54,7 @@ diarizer_image = ( "hf-transfer" ) .run_function(migrate_cache_llm) - .run_function(download_pyannote_audio) + .run_function(download_pyannote_audio, secrets=[modal.Secret.from_name("my-huggingface-secret")]) .env( { "LD_LIBRARY_PATH": ( @@ -73,6 +72,7 @@ diarizer_image = ( container_idle_timeout=60, allow_concurrent_inputs=1, image=diarizer_image, + secrets=[modal.Secret.from_name("my-huggingface-secret")], ) class Diarizer: def __enter__(self): diff --git a/server/gpu/modal/reflector_llm.py b/server/gpu/modal_deployments/reflector_llm.py similarity index 100% rename from server/gpu/modal/reflector_llm.py rename to server/gpu/modal_deployments/reflector_llm.py diff --git a/server/gpu/modal/reflector_llm_zephyr.py b/server/gpu/modal_deployments/reflector_llm_zephyr.py similarity index 100% rename from server/gpu/modal/reflector_llm_zephyr.py rename to server/gpu/modal_deployments/reflector_llm_zephyr.py diff --git a/server/gpu/modal/reflector_transcriber.py b/server/gpu/modal_deployments/reflector_transcriber.py similarity index 100% rename from server/gpu/modal/reflector_transcriber.py rename to server/gpu/modal_deployments/reflector_transcriber.py diff --git a/server/gpu/modal/reflector_translator.py b/server/gpu/modal_deployments/reflector_translator.py similarity index 100% rename from server/gpu/modal/reflector_translator.py rename to server/gpu/modal_deployments/reflector_translator.py