mirror of
https://github.com/Monadical-SAS/reflector.git
synced 2025-12-21 12:49:06 +00:00
Compare commits
20 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
| af921ce927 | |||
|
|
bd5df1ce2e | ||
| c8024484b3 | |||
| 28f87c09dc | |||
| dabf7251db | |||
|
|
b51b7aa917 | ||
|
|
a8983b4e7e | ||
|
|
fe47c46489 | ||
| a2bb6a27d6 | |||
| 7f0b728991 | |||
| 692895c859 | |||
|
|
d63040e2fd | ||
| 8d696aa775 | |||
| f6ca07505f | |||
|
|
3aef926203 | ||
|
|
0b2c82227d | ||
|
|
689c8075cc | ||
| 201671368a | |||
|
|
86d5e26224 | ||
| 9bec39808f |
51
CHANGELOG.md
51
CHANGELOG.md
@@ -1,5 +1,56 @@
|
|||||||
# Changelog
|
# Changelog
|
||||||
|
|
||||||
|
## [0.22.4](https://github.com/Monadical-SAS/reflector/compare/v0.22.3...v0.22.4) (2025-12-02)
|
||||||
|
|
||||||
|
|
||||||
|
### Bug Fixes
|
||||||
|
|
||||||
|
* Multitrack mixdown optimisation 2 ([#764](https://github.com/Monadical-SAS/reflector/issues/764)) ([bd5df1c](https://github.com/Monadical-SAS/reflector/commit/bd5df1ce2ebf35d7f3413b295e56937a9a28ef7b))
|
||||||
|
|
||||||
|
## [0.22.3](https://github.com/Monadical-SAS/reflector/compare/v0.22.2...v0.22.3) (2025-12-02)
|
||||||
|
|
||||||
|
|
||||||
|
### Bug Fixes
|
||||||
|
|
||||||
|
* align daily room settings ([#759](https://github.com/Monadical-SAS/reflector/issues/759)) ([28f87c0](https://github.com/Monadical-SAS/reflector/commit/28f87c09dc459846873d0dde65b03e3d7b2b9399))
|
||||||
|
|
||||||
|
## [0.22.2](https://github.com/Monadical-SAS/reflector/compare/v0.22.1...v0.22.2) (2025-12-02)
|
||||||
|
|
||||||
|
|
||||||
|
### Bug Fixes
|
||||||
|
|
||||||
|
* daily auto refresh fix ([#755](https://github.com/Monadical-SAS/reflector/issues/755)) ([fe47c46](https://github.com/Monadical-SAS/reflector/commit/fe47c46489c5aa0cc538109f7559cc9accb35c01))
|
||||||
|
* Skip mixdown for multitrack ([#760](https://github.com/Monadical-SAS/reflector/issues/760)) ([b51b7aa](https://github.com/Monadical-SAS/reflector/commit/b51b7aa9176c1a53ba57ad99f5e976c804a1e80c))
|
||||||
|
|
||||||
|
## [0.22.1](https://github.com/Monadical-SAS/reflector/compare/v0.22.0...v0.22.1) (2025-11-27)
|
||||||
|
|
||||||
|
|
||||||
|
### Bug Fixes
|
||||||
|
|
||||||
|
* participants update from daily ([#749](https://github.com/Monadical-SAS/reflector/issues/749)) ([7f0b728](https://github.com/Monadical-SAS/reflector/commit/7f0b728991c1b9f9aae702c96297eae63b561ef5))
|
||||||
|
|
||||||
|
## [0.22.0](https://github.com/Monadical-SAS/reflector/compare/v0.21.0...v0.22.0) (2025-11-26)
|
||||||
|
|
||||||
|
|
||||||
|
### Features
|
||||||
|
|
||||||
|
* Multitrack segmentation ([#747](https://github.com/Monadical-SAS/reflector/issues/747)) ([d63040e](https://github.com/Monadical-SAS/reflector/commit/d63040e2fdc07e7b272e85a39eb2411cd6a14798))
|
||||||
|
|
||||||
|
## [0.21.0](https://github.com/Monadical-SAS/reflector/compare/v0.20.0...v0.21.0) (2025-11-26)
|
||||||
|
|
||||||
|
|
||||||
|
### Features
|
||||||
|
|
||||||
|
* add transcript format parameter to GET endpoint ([#709](https://github.com/Monadical-SAS/reflector/issues/709)) ([f6ca075](https://github.com/Monadical-SAS/reflector/commit/f6ca07505f34483b02270a2ef3bd809e9d2e1045))
|
||||||
|
|
||||||
|
## [0.20.0](https://github.com/Monadical-SAS/reflector/compare/v0.19.0...v0.20.0) (2025-11-25)
|
||||||
|
|
||||||
|
|
||||||
|
### Features
|
||||||
|
|
||||||
|
* link transcript participants ([#737](https://github.com/Monadical-SAS/reflector/issues/737)) ([9bec398](https://github.com/Monadical-SAS/reflector/commit/9bec39808fc6322612d8b87e922a6f7901fc01c1))
|
||||||
|
* transcript restart script ([#742](https://github.com/Monadical-SAS/reflector/issues/742)) ([86d5e26](https://github.com/Monadical-SAS/reflector/commit/86d5e26224bb55a0f1cc785aeda52065bb92ee6f))
|
||||||
|
|
||||||
## [0.19.0](https://github.com/Monadical-SAS/reflector/compare/v0.18.0...v0.19.0) (2025-11-25)
|
## [0.19.0](https://github.com/Monadical-SAS/reflector/compare/v0.18.0...v0.19.0) (2025-11-25)
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
@@ -168,6 +168,12 @@ You can manually process an audio file by calling the process tool:
|
|||||||
uv run python -m reflector.tools.process path/to/audio.wav
|
uv run python -m reflector.tools.process path/to/audio.wav
|
||||||
```
|
```
|
||||||
|
|
||||||
|
## Reprocessing any transcription
|
||||||
|
|
||||||
|
```bash
|
||||||
|
uv run -m reflector.tools.process_transcript 81ec38d1-9dd7-43d2-b3f8-51f4d34a07cd --sync
|
||||||
|
```
|
||||||
|
|
||||||
## Build-time env variables
|
## Build-time env variables
|
||||||
|
|
||||||
Next.js projects typically rely on NEXT_PUBLIC_-prefixed build-time variables. We don't use those because we need to serve a customizable prebuilt Docker container.
|
Next.js projects typically rely on NEXT_PUBLIC_-prefixed build-time variables. We don't use those because we need to serve a customizable prebuilt Docker container.
|
||||||
|
|||||||
241
docs/transcript.md
Normal file
241
docs/transcript.md
Normal file
@@ -0,0 +1,241 @@
|
|||||||
|
# Transcript Formats
|
||||||
|
|
||||||
|
The Reflector API provides multiple output formats for transcript data through the `transcript_format` query parameter on the GET `/v1/transcripts/{id}` endpoint.
|
||||||
|
|
||||||
|
## Overview
|
||||||
|
|
||||||
|
When retrieving a transcript, you can specify the desired format using the `transcript_format` query parameter. The API supports four formats optimized for different use cases:
|
||||||
|
|
||||||
|
- **text** - Plain text with speaker names (default)
|
||||||
|
- **text-timestamped** - Timestamped text with speaker names
|
||||||
|
- **webvtt-named** - WebVTT subtitle format with participant names
|
||||||
|
- **json** - Structured JSON segments with full metadata
|
||||||
|
|
||||||
|
All formats include participant information when available, resolving speaker IDs to actual names.
|
||||||
|
|
||||||
|
## Query Parameter Usage
|
||||||
|
|
||||||
|
```
|
||||||
|
GET /v1/transcripts/{id}?transcript_format={format}
|
||||||
|
```
|
||||||
|
|
||||||
|
### Parameters
|
||||||
|
|
||||||
|
- `transcript_format` (optional): The desired output format
|
||||||
|
- Type: `"text" | "text-timestamped" | "webvtt-named" | "json"`
|
||||||
|
- Default: `"text"`
|
||||||
|
|
||||||
|
## Format Descriptions
|
||||||
|
|
||||||
|
### Text Format (`text`)
|
||||||
|
|
||||||
|
**Use case:** Simple, human-readable transcript for display or export.
|
||||||
|
|
||||||
|
**Format:** Speaker names followed by their dialogue, one line per segment.
|
||||||
|
|
||||||
|
**Example:**
|
||||||
|
```
|
||||||
|
John Smith: Hello everyone
|
||||||
|
Jane Doe: Hi there
|
||||||
|
John Smith: How are you today?
|
||||||
|
```
|
||||||
|
|
||||||
|
**Request:**
|
||||||
|
```bash
|
||||||
|
GET /v1/transcripts/{id}?transcript_format=text
|
||||||
|
```
|
||||||
|
|
||||||
|
**Response:**
|
||||||
|
```json
|
||||||
|
{
|
||||||
|
"id": "transcript_123",
|
||||||
|
"name": "Meeting Recording",
|
||||||
|
"transcript_format": "text",
|
||||||
|
"transcript": "John Smith: Hello everyone\nJane Doe: Hi there\nJohn Smith: How are you today?",
|
||||||
|
"participants": [
|
||||||
|
{"id": "p1", "speaker": 0, "name": "John Smith"},
|
||||||
|
{"id": "p2", "speaker": 1, "name": "Jane Doe"}
|
||||||
|
],
|
||||||
|
...
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
### Text Timestamped Format (`text-timestamped`)
|
||||||
|
|
||||||
|
**Use case:** Transcript with timing information for navigation or reference.
|
||||||
|
|
||||||
|
**Format:** `[MM:SS]` timestamp prefix before each speaker and dialogue.
|
||||||
|
|
||||||
|
**Example:**
|
||||||
|
```
|
||||||
|
[00:00] John Smith: Hello everyone
|
||||||
|
[00:05] Jane Doe: Hi there
|
||||||
|
[00:12] John Smith: How are you today?
|
||||||
|
```
|
||||||
|
|
||||||
|
**Request:**
|
||||||
|
```bash
|
||||||
|
GET /v1/transcripts/{id}?transcript_format=text-timestamped
|
||||||
|
```
|
||||||
|
|
||||||
|
**Response:**
|
||||||
|
```json
|
||||||
|
{
|
||||||
|
"id": "transcript_123",
|
||||||
|
"name": "Meeting Recording",
|
||||||
|
"transcript_format": "text-timestamped",
|
||||||
|
"transcript": "[00:00] John Smith: Hello everyone\n[00:05] Jane Doe: Hi there\n[00:12] John Smith: How are you today?",
|
||||||
|
"participants": [
|
||||||
|
{"id": "p1", "speaker": 0, "name": "John Smith"},
|
||||||
|
{"id": "p2", "speaker": 1, "name": "Jane Doe"}
|
||||||
|
],
|
||||||
|
...
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
### WebVTT Named Format (`webvtt-named`)
|
||||||
|
|
||||||
|
**Use case:** Subtitle files for video players, accessibility tools, or video editing.
|
||||||
|
|
||||||
|
**Format:** Standard WebVTT subtitle format with voice tags using participant names.
|
||||||
|
|
||||||
|
**Example:**
|
||||||
|
```
|
||||||
|
WEBVTT
|
||||||
|
|
||||||
|
00:00:00.000 --> 00:00:05.000
|
||||||
|
<v John Smith>Hello everyone
|
||||||
|
|
||||||
|
00:00:05.000 --> 00:00:12.000
|
||||||
|
<v Jane Doe>Hi there
|
||||||
|
|
||||||
|
00:00:12.000 --> 00:00:18.000
|
||||||
|
<v John Smith>How are you today?
|
||||||
|
```
|
||||||
|
|
||||||
|
**Request:**
|
||||||
|
```bash
|
||||||
|
GET /v1/transcripts/{id}?transcript_format=webvtt-named
|
||||||
|
```
|
||||||
|
|
||||||
|
**Response:**
|
||||||
|
```json
|
||||||
|
{
|
||||||
|
"id": "transcript_123",
|
||||||
|
"name": "Meeting Recording",
|
||||||
|
"transcript_format": "webvtt-named",
|
||||||
|
"transcript": "WEBVTT\n\n00:00:00.000 --> 00:00:05.000\n<v John Smith>Hello everyone\n\n...",
|
||||||
|
"participants": [
|
||||||
|
{"id": "p1", "speaker": 0, "name": "John Smith"},
|
||||||
|
{"id": "p2", "speaker": 1, "name": "Jane Doe"}
|
||||||
|
],
|
||||||
|
...
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
### JSON Format (`json`)
|
||||||
|
|
||||||
|
**Use case:** Programmatic access with full timing and speaker metadata.
|
||||||
|
|
||||||
|
**Format:** Array of segment objects with speaker information, text content, and precise timing.
|
||||||
|
|
||||||
|
**Example:**
|
||||||
|
```json
|
||||||
|
[
|
||||||
|
{
|
||||||
|
"speaker": 0,
|
||||||
|
"speaker_name": "John Smith",
|
||||||
|
"text": "Hello everyone",
|
||||||
|
"start": 0.0,
|
||||||
|
"end": 5.0
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"speaker": 1,
|
||||||
|
"speaker_name": "Jane Doe",
|
||||||
|
"text": "Hi there",
|
||||||
|
"start": 5.0,
|
||||||
|
"end": 12.0
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"speaker": 0,
|
||||||
|
"speaker_name": "John Smith",
|
||||||
|
"text": "How are you today?",
|
||||||
|
"start": 12.0,
|
||||||
|
"end": 18.0
|
||||||
|
}
|
||||||
|
]
|
||||||
|
```
|
||||||
|
|
||||||
|
**Request:**
|
||||||
|
```bash
|
||||||
|
GET /v1/transcripts/{id}?transcript_format=json
|
||||||
|
```
|
||||||
|
|
||||||
|
**Response:**
|
||||||
|
```json
|
||||||
|
{
|
||||||
|
"id": "transcript_123",
|
||||||
|
"name": "Meeting Recording",
|
||||||
|
"transcript_format": "json",
|
||||||
|
"transcript": [
|
||||||
|
{
|
||||||
|
"speaker": 0,
|
||||||
|
"speaker_name": "John Smith",
|
||||||
|
"text": "Hello everyone",
|
||||||
|
"start": 0.0,
|
||||||
|
"end": 5.0
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"speaker": 1,
|
||||||
|
"speaker_name": "Jane Doe",
|
||||||
|
"text": "Hi there",
|
||||||
|
"start": 5.0,
|
||||||
|
"end": 12.0
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"participants": [
|
||||||
|
{"id": "p1", "speaker": 0, "name": "John Smith"},
|
||||||
|
{"id": "p2", "speaker": 1, "name": "Jane Doe"}
|
||||||
|
],
|
||||||
|
...
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
## Response Structure
|
||||||
|
|
||||||
|
All formats return the same base transcript metadata with an additional `transcript_format` field and format-specific `transcript` field:
|
||||||
|
|
||||||
|
### Common Fields
|
||||||
|
|
||||||
|
- `id`: Transcript identifier
|
||||||
|
- `user_id`: Owner user ID (if authenticated)
|
||||||
|
- `name`: Transcript name
|
||||||
|
- `status`: Processing status
|
||||||
|
- `locked`: Whether transcript is locked for editing
|
||||||
|
- `duration`: Total duration in seconds
|
||||||
|
- `title`: Auto-generated or custom title
|
||||||
|
- `short_summary`: Brief summary
|
||||||
|
- `long_summary`: Detailed summary
|
||||||
|
- `created_at`: Creation timestamp
|
||||||
|
- `share_mode`: Access control setting
|
||||||
|
- `source_language`: Original audio language
|
||||||
|
- `target_language`: Translation target language
|
||||||
|
- `reviewed`: Whether transcript has been reviewed
|
||||||
|
- `meeting_id`: Associated meeting ID (if applicable)
|
||||||
|
- `source_kind`: Source type (live, file, room)
|
||||||
|
- `room_id`: Associated room ID (if applicable)
|
||||||
|
- `audio_deleted`: Whether audio has been deleted
|
||||||
|
- `participants`: Array of participant objects with speaker mappings
|
||||||
|
|
||||||
|
### Format-Specific Fields
|
||||||
|
|
||||||
|
- `transcript_format`: The format identifier (discriminator field)
|
||||||
|
- `transcript`: The formatted transcript content (string for text/webvtt formats, array for json format)
|
||||||
|
|
||||||
|
## Speaker Name Resolution
|
||||||
|
|
||||||
|
All formats resolve speaker IDs to participant names when available:
|
||||||
|
|
||||||
|
- If a participant exists for the speaker ID, their name is used
|
||||||
|
- If no participant exists, a default name like "Speaker 0" is generated
|
||||||
|
- Speaker IDs are integers (0, 1, 2, etc.) assigned during diarization
|
||||||
38
server/migrations/versions/bbafedfa510c_add_user_table.py
Normal file
38
server/migrations/versions/bbafedfa510c_add_user_table.py
Normal file
@@ -0,0 +1,38 @@
|
|||||||
|
"""add user table
|
||||||
|
|
||||||
|
Revision ID: bbafedfa510c
|
||||||
|
Revises: 5d6b9df9b045
|
||||||
|
Create Date: 2025-11-19 21:06:30.543262
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
from typing import Sequence, Union
|
||||||
|
|
||||||
|
import sqlalchemy as sa
|
||||||
|
from alembic import op
|
||||||
|
|
||||||
|
# revision identifiers, used by Alembic.
|
||||||
|
revision: str = "bbafedfa510c"
|
||||||
|
down_revision: Union[str, None] = "5d6b9df9b045"
|
||||||
|
branch_labels: Union[str, Sequence[str], None] = None
|
||||||
|
depends_on: Union[str, Sequence[str], None] = None
|
||||||
|
|
||||||
|
|
||||||
|
def upgrade() -> None:
|
||||||
|
op.create_table(
|
||||||
|
"user",
|
||||||
|
sa.Column("id", sa.String(), nullable=False),
|
||||||
|
sa.Column("email", sa.String(), nullable=False),
|
||||||
|
sa.Column("authentik_uid", sa.String(), nullable=False),
|
||||||
|
sa.Column("created_at", sa.DateTime(timezone=True), nullable=False),
|
||||||
|
sa.Column("updated_at", sa.DateTime(timezone=True), nullable=False),
|
||||||
|
sa.PrimaryKeyConstraint("id"),
|
||||||
|
)
|
||||||
|
|
||||||
|
with op.batch_alter_table("user", schema=None) as batch_op:
|
||||||
|
batch_op.create_index("idx_user_authentik_uid", ["authentik_uid"], unique=True)
|
||||||
|
batch_op.create_index("idx_user_email", ["email"], unique=False)
|
||||||
|
|
||||||
|
|
||||||
|
def downgrade() -> None:
|
||||||
|
op.drop_table("user")
|
||||||
@@ -6,8 +6,10 @@ from jose import JWTError, jwt
|
|||||||
from pydantic import BaseModel
|
from pydantic import BaseModel
|
||||||
|
|
||||||
from reflector.db.user_api_keys import user_api_keys_controller
|
from reflector.db.user_api_keys import user_api_keys_controller
|
||||||
|
from reflector.db.users import user_controller
|
||||||
from reflector.logger import logger
|
from reflector.logger import logger
|
||||||
from reflector.settings import settings
|
from reflector.settings import settings
|
||||||
|
from reflector.utils import generate_uuid4
|
||||||
|
|
||||||
oauth2_scheme = OAuth2PasswordBearer(tokenUrl="token", auto_error=False)
|
oauth2_scheme = OAuth2PasswordBearer(tokenUrl="token", auto_error=False)
|
||||||
api_key_header = APIKeyHeader(name="X-API-Key", auto_error=False)
|
api_key_header = APIKeyHeader(name="X-API-Key", auto_error=False)
|
||||||
@@ -74,9 +76,21 @@ async def _authenticate_user(
|
|||||||
if jwt_token:
|
if jwt_token:
|
||||||
try:
|
try:
|
||||||
payload = jwtauth.verify_token(jwt_token)
|
payload = jwtauth.verify_token(jwt_token)
|
||||||
sub = payload["sub"]
|
authentik_uid = payload["sub"]
|
||||||
email = payload["email"]
|
email = payload["email"]
|
||||||
user_infos.append(UserInfo(sub=sub, email=email))
|
|
||||||
|
user = await user_controller.get_by_authentik_uid(authentik_uid)
|
||||||
|
if not user:
|
||||||
|
logger.info(
|
||||||
|
f"Creating new user on first login: {authentik_uid} ({email})"
|
||||||
|
)
|
||||||
|
user = await user_controller.create_or_update(
|
||||||
|
id=generate_uuid4(),
|
||||||
|
authentik_uid=authentik_uid,
|
||||||
|
email=email,
|
||||||
|
)
|
||||||
|
|
||||||
|
user_infos.append(UserInfo(sub=user.id, email=email))
|
||||||
except JWTError as e:
|
except JWTError as e:
|
||||||
logger.error(f"JWT error: {e}")
|
logger.error(f"JWT error: {e}")
|
||||||
raise HTTPException(status_code=401, detail="Invalid authentication")
|
raise HTTPException(status_code=401, detail="Invalid authentication")
|
||||||
|
|||||||
@@ -40,6 +40,10 @@ class RoomProperties(BaseModel):
|
|||||||
)
|
)
|
||||||
enable_chat: bool = Field(default=True, description="Enable in-meeting chat")
|
enable_chat: bool = Field(default=True, description="Enable in-meeting chat")
|
||||||
enable_screenshare: bool = Field(default=True, description="Enable screen sharing")
|
enable_screenshare: bool = Field(default=True, description="Enable screen sharing")
|
||||||
|
enable_knocking: bool = Field(
|
||||||
|
default=False,
|
||||||
|
description="Enable knocking for private rooms (allows participants to request access)",
|
||||||
|
)
|
||||||
start_video_off: bool = Field(
|
start_video_off: bool = Field(
|
||||||
default=False, description="Start with video off for all participants"
|
default=False, description="Start with video off for all participants"
|
||||||
)
|
)
|
||||||
|
|||||||
@@ -68,7 +68,7 @@ class MeetingParticipant(BaseModel):
|
|||||||
Reference: https://docs.daily.co/reference/rest-api/meetings/get-meeting-participants
|
Reference: https://docs.daily.co/reference/rest-api/meetings/get-meeting-participants
|
||||||
"""
|
"""
|
||||||
|
|
||||||
user_id: NonEmptyString = Field(description="User identifier")
|
user_id: NonEmptyString | None = Field(None, description="User identifier")
|
||||||
participant_id: NonEmptyString = Field(description="Participant session identifier")
|
participant_id: NonEmptyString = Field(description="Participant session identifier")
|
||||||
user_name: NonEmptyString | None = Field(None, description="User display name")
|
user_name: NonEmptyString | None = Field(None, description="User display name")
|
||||||
join_time: int = Field(description="Join timestamp (Unix epoch seconds)")
|
join_time: int = Field(description="Join timestamp (Unix epoch seconds)")
|
||||||
|
|||||||
@@ -195,7 +195,6 @@ def parse_recording_error(event: DailyWebhookEvent) -> RecordingErrorPayload:
|
|||||||
return RecordingErrorPayload(**event.payload)
|
return RecordingErrorPayload(**event.payload)
|
||||||
|
|
||||||
|
|
||||||
# Webhook event type to parser mapping
|
|
||||||
WEBHOOK_PARSERS = {
|
WEBHOOK_PARSERS = {
|
||||||
"participant.joined": parse_participant_joined,
|
"participant.joined": parse_participant_joined,
|
||||||
"participant.left": parse_participant_left,
|
"participant.left": parse_participant_left,
|
||||||
|
|||||||
@@ -31,6 +31,7 @@ import reflector.db.recordings # noqa
|
|||||||
import reflector.db.rooms # noqa
|
import reflector.db.rooms # noqa
|
||||||
import reflector.db.transcripts # noqa
|
import reflector.db.transcripts # noqa
|
||||||
import reflector.db.user_api_keys # noqa
|
import reflector.db.user_api_keys # noqa
|
||||||
|
import reflector.db.users # noqa
|
||||||
|
|
||||||
kwargs = {}
|
kwargs = {}
|
||||||
if "postgres" not in settings.DATABASE_URL:
|
if "postgres" not in settings.DATABASE_URL:
|
||||||
|
|||||||
@@ -35,8 +35,15 @@ class Recording(BaseModel):
|
|||||||
status: Literal["pending", "processing", "completed", "failed"] = "pending"
|
status: Literal["pending", "processing", "completed", "failed"] = "pending"
|
||||||
meeting_id: str | None = None
|
meeting_id: str | None = None
|
||||||
# for multitrack reprocessing
|
# for multitrack reprocessing
|
||||||
|
# track_keys can be empty list [] if recording finished but no audio was captured (silence/muted)
|
||||||
|
# None means not a multitrack recording; [] means a multitrack recording with no tracks (is_multitrack is False in both cases)
|
||||||
track_keys: list[str] | None = None
|
track_keys: list[str] | None = None
|
||||||
|
|
||||||
|
@property
|
||||||
|
def is_multitrack(self) -> bool:
|
||||||
|
"""True if recording has separate audio tracks (1+ tracks counts as multitrack)."""
|
||||||
|
return self.track_keys is not None and len(self.track_keys) > 0
|
||||||
|
|
||||||
|
|
||||||
class RecordingController:
|
class RecordingController:
|
||||||
async def create(self, recording: Recording):
|
async def create(self, recording: Recording):
|
||||||
|
|||||||
92
server/reflector/db/users.py
Normal file
92
server/reflector/db/users.py
Normal file
@@ -0,0 +1,92 @@
|
|||||||
|
"""User table for storing Authentik user information."""
|
||||||
|
|
||||||
|
from datetime import datetime, timezone
|
||||||
|
|
||||||
|
import sqlalchemy
|
||||||
|
from pydantic import BaseModel, Field
|
||||||
|
|
||||||
|
from reflector.db import get_database, metadata
|
||||||
|
from reflector.utils import generate_uuid4
|
||||||
|
from reflector.utils.string import NonEmptyString
|
||||||
|
|
||||||
|
users = sqlalchemy.Table(
|
||||||
|
"user",
|
||||||
|
metadata,
|
||||||
|
sqlalchemy.Column("id", sqlalchemy.String, primary_key=True),
|
||||||
|
sqlalchemy.Column("email", sqlalchemy.String, nullable=False),
|
||||||
|
sqlalchemy.Column("authentik_uid", sqlalchemy.String, nullable=False),
|
||||||
|
sqlalchemy.Column("created_at", sqlalchemy.DateTime(timezone=True), nullable=False),
|
||||||
|
sqlalchemy.Column("updated_at", sqlalchemy.DateTime(timezone=True), nullable=False),
|
||||||
|
sqlalchemy.Index("idx_user_authentik_uid", "authentik_uid", unique=True),
|
||||||
|
sqlalchemy.Index("idx_user_email", "email", unique=False),
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
class User(BaseModel):
|
||||||
|
id: NonEmptyString = Field(default_factory=generate_uuid4)
|
||||||
|
email: NonEmptyString
|
||||||
|
authentik_uid: NonEmptyString
|
||||||
|
created_at: datetime = Field(default_factory=lambda: datetime.now(timezone.utc))
|
||||||
|
updated_at: datetime = Field(default_factory=lambda: datetime.now(timezone.utc))
|
||||||
|
|
||||||
|
|
||||||
|
class UserController:
|
||||||
|
@staticmethod
|
||||||
|
async def get_by_id(user_id: NonEmptyString) -> User | None:
|
||||||
|
query = users.select().where(users.c.id == user_id)
|
||||||
|
result = await get_database().fetch_one(query)
|
||||||
|
return User(**result) if result else None
|
||||||
|
|
||||||
|
@staticmethod
|
||||||
|
async def get_by_authentik_uid(authentik_uid: NonEmptyString) -> User | None:
|
||||||
|
query = users.select().where(users.c.authentik_uid == authentik_uid)
|
||||||
|
result = await get_database().fetch_one(query)
|
||||||
|
return User(**result) if result else None
|
||||||
|
|
||||||
|
@staticmethod
|
||||||
|
async def get_by_email(email: NonEmptyString) -> User | None:
|
||||||
|
query = users.select().where(users.c.email == email)
|
||||||
|
result = await get_database().fetch_one(query)
|
||||||
|
return User(**result) if result else None
|
||||||
|
|
||||||
|
@staticmethod
|
||||||
|
async def create_or_update(
|
||||||
|
id: NonEmptyString, authentik_uid: NonEmptyString, email: NonEmptyString
|
||||||
|
) -> User:
|
||||||
|
existing = await UserController.get_by_authentik_uid(authentik_uid)
|
||||||
|
now = datetime.now(timezone.utc)
|
||||||
|
|
||||||
|
if existing:
|
||||||
|
query = (
|
||||||
|
users.update()
|
||||||
|
.where(users.c.authentik_uid == authentik_uid)
|
||||||
|
.values(email=email, updated_at=now)
|
||||||
|
)
|
||||||
|
await get_database().execute(query)
|
||||||
|
return User(
|
||||||
|
id=existing.id,
|
||||||
|
authentik_uid=authentik_uid,
|
||||||
|
email=email,
|
||||||
|
created_at=existing.created_at,
|
||||||
|
updated_at=now,
|
||||||
|
)
|
||||||
|
else:
|
||||||
|
user = User(
|
||||||
|
id=id,
|
||||||
|
authentik_uid=authentik_uid,
|
||||||
|
email=email,
|
||||||
|
created_at=now,
|
||||||
|
updated_at=now,
|
||||||
|
)
|
||||||
|
query = users.insert().values(**user.model_dump())
|
||||||
|
await get_database().execute(query)
|
||||||
|
return user
|
||||||
|
|
||||||
|
@staticmethod
|
||||||
|
async def list_all() -> list[User]:
|
||||||
|
query = users.select().order_by(users.c.created_at.desc())
|
||||||
|
results = await get_database().fetch_all(query)
|
||||||
|
return [User(**r) for r in results]
|
||||||
|
|
||||||
|
|
||||||
|
user_controller = UserController()
|
||||||
@@ -9,7 +9,10 @@ from av.audio.resampler import AudioResampler
|
|||||||
from celery import chain, shared_task
|
from celery import chain, shared_task
|
||||||
|
|
||||||
from reflector.asynctask import asynctask
|
from reflector.asynctask import asynctask
|
||||||
|
from reflector.dailyco_api import MeetingParticipantsResponse
|
||||||
from reflector.db.transcripts import (
|
from reflector.db.transcripts import (
|
||||||
|
Transcript,
|
||||||
|
TranscriptParticipant,
|
||||||
TranscriptStatus,
|
TranscriptStatus,
|
||||||
TranscriptWaveform,
|
TranscriptWaveform,
|
||||||
transcripts_controller,
|
transcripts_controller,
|
||||||
@@ -29,7 +32,12 @@ from reflector.processors.audio_waveform_processor import AudioWaveformProcessor
|
|||||||
from reflector.processors.types import TitleSummary
|
from reflector.processors.types import TitleSummary
|
||||||
from reflector.processors.types import Transcript as TranscriptType
|
from reflector.processors.types import Transcript as TranscriptType
|
||||||
from reflector.storage import Storage, get_transcripts_storage
|
from reflector.storage import Storage, get_transcripts_storage
|
||||||
|
from reflector.utils.daily import (
|
||||||
|
filter_cam_audio_tracks,
|
||||||
|
parse_daily_recording_filename,
|
||||||
|
)
|
||||||
from reflector.utils.string import NonEmptyString
|
from reflector.utils.string import NonEmptyString
|
||||||
|
from reflector.video_platforms.factory import create_platform_client
|
||||||
|
|
||||||
# Audio encoding constants
|
# Audio encoding constants
|
||||||
OPUS_STANDARD_SAMPLE_RATE = 48000
|
OPUS_STANDARD_SAMPLE_RATE = 48000
|
||||||
@@ -414,7 +422,15 @@ class PipelineMainMultitrack(PipelineMainBase):
|
|||||||
# Open all containers with cleanup guaranteed
|
# Open all containers with cleanup guaranteed
|
||||||
for i, url in enumerate(valid_track_urls):
|
for i, url in enumerate(valid_track_urls):
|
||||||
try:
|
try:
|
||||||
c = av.open(url)
|
c = av.open(
|
||||||
|
url,
|
||||||
|
options={
|
||||||
|
# it's trying to stream from s3 by default
|
||||||
|
"reconnect": "1",
|
||||||
|
"reconnect_streamed": "1",
|
||||||
|
"reconnect_delay_max": "5",
|
||||||
|
},
|
||||||
|
)
|
||||||
containers.append(c)
|
containers.append(c)
|
||||||
except Exception as e:
|
except Exception as e:
|
||||||
self.logger.warning(
|
self.logger.warning(
|
||||||
@@ -443,6 +459,8 @@ class PipelineMainMultitrack(PipelineMainBase):
|
|||||||
frame = next(dec)
|
frame = next(dec)
|
||||||
except StopIteration:
|
except StopIteration:
|
||||||
active[i] = False
|
active[i] = False
|
||||||
|
# causes stream to move on / unclogs memory
|
||||||
|
inputs[i].push(None)
|
||||||
continue
|
continue
|
||||||
|
|
||||||
if frame.sample_rate != target_sample_rate:
|
if frame.sample_rate != target_sample_rate:
|
||||||
@@ -462,8 +480,6 @@ class PipelineMainMultitrack(PipelineMainBase):
|
|||||||
mixed.time_base = Fraction(1, target_sample_rate)
|
mixed.time_base = Fraction(1, target_sample_rate)
|
||||||
await writer.push(mixed)
|
await writer.push(mixed)
|
||||||
|
|
||||||
for in_ctx in inputs:
|
|
||||||
in_ctx.push(None)
|
|
||||||
while True:
|
while True:
|
||||||
try:
|
try:
|
||||||
mixed = sink.pull()
|
mixed = sink.pull()
|
||||||
@@ -494,6 +510,90 @@ class PipelineMainMultitrack(PipelineMainBase):
|
|||||||
transcript=transcript, event="WAVEFORM", data=waveform
|
transcript=transcript, event="WAVEFORM", data=waveform
|
||||||
)
|
)
|
||||||
|
|
||||||
|
async def update_participants_from_daily(
|
||||||
|
self, transcript: Transcript, track_keys: list[str]
|
||||||
|
) -> None:
|
||||||
|
"""Update transcript participants with user_id and names from Daily.co API."""
|
||||||
|
if not transcript.recording_id:
|
||||||
|
return
|
||||||
|
|
||||||
|
try:
|
||||||
|
async with create_platform_client("daily") as daily_client:
|
||||||
|
id_to_name = {}
|
||||||
|
id_to_user_id = {}
|
||||||
|
|
||||||
|
try:
|
||||||
|
rec_details = await daily_client.get_recording(
|
||||||
|
transcript.recording_id
|
||||||
|
)
|
||||||
|
mtg_session_id = rec_details.mtgSessionId
|
||||||
|
if mtg_session_id:
|
||||||
|
try:
|
||||||
|
payload: MeetingParticipantsResponse = (
|
||||||
|
await daily_client.get_meeting_participants(
|
||||||
|
mtg_session_id
|
||||||
|
)
|
||||||
|
)
|
||||||
|
for p in payload.data:
|
||||||
|
pid = p.participant_id
|
||||||
|
name = p.user_name
|
||||||
|
user_id = p.user_id
|
||||||
|
if name:
|
||||||
|
id_to_name[pid] = name
|
||||||
|
if user_id:
|
||||||
|
id_to_user_id[pid] = user_id
|
||||||
|
except Exception as e:
|
||||||
|
self.logger.warning(
|
||||||
|
"Failed to fetch Daily meeting participants",
|
||||||
|
error=str(e),
|
||||||
|
mtg_session_id=mtg_session_id,
|
||||||
|
exc_info=True,
|
||||||
|
)
|
||||||
|
else:
|
||||||
|
self.logger.warning(
|
||||||
|
"No mtgSessionId found for recording; participant names may be generic",
|
||||||
|
recording_id=transcript.recording_id,
|
||||||
|
)
|
||||||
|
except Exception as e:
|
||||||
|
self.logger.warning(
|
||||||
|
"Failed to fetch Daily recording details",
|
||||||
|
error=str(e),
|
||||||
|
recording_id=transcript.recording_id,
|
||||||
|
exc_info=True,
|
||||||
|
)
|
||||||
|
return
|
||||||
|
|
||||||
|
cam_audio_keys = filter_cam_audio_tracks(track_keys)
|
||||||
|
|
||||||
|
for idx, key in enumerate(cam_audio_keys):
|
||||||
|
try:
|
||||||
|
parsed = parse_daily_recording_filename(key)
|
||||||
|
participant_id = parsed.participant_id
|
||||||
|
except ValueError as e:
|
||||||
|
self.logger.error(
|
||||||
|
"Failed to parse Daily recording filename",
|
||||||
|
error=str(e),
|
||||||
|
key=key,
|
||||||
|
exc_info=True,
|
||||||
|
)
|
||||||
|
continue
|
||||||
|
|
||||||
|
default_name = f"Speaker {idx}"
|
||||||
|
name = id_to_name.get(participant_id, default_name)
|
||||||
|
user_id = id_to_user_id.get(participant_id)
|
||||||
|
|
||||||
|
participant = TranscriptParticipant(
|
||||||
|
id=participant_id, speaker=idx, name=name, user_id=user_id
|
||||||
|
)
|
||||||
|
await transcripts_controller.upsert_participant(
|
||||||
|
transcript, participant
|
||||||
|
)
|
||||||
|
|
||||||
|
except Exception as e:
|
||||||
|
self.logger.warning(
|
||||||
|
"Failed to map participant names", error=str(e), exc_info=True
|
||||||
|
)
|
||||||
|
|
||||||
async def process(self, bucket_name: str, track_keys: list[str]):
|
async def process(self, bucket_name: str, track_keys: list[str]):
|
||||||
transcript = await self.get_transcript()
|
transcript = await self.get_transcript()
|
||||||
async with self.transaction():
|
async with self.transaction():
|
||||||
@@ -502,9 +602,12 @@ class PipelineMainMultitrack(PipelineMainBase):
|
|||||||
{
|
{
|
||||||
"events": [],
|
"events": [],
|
||||||
"topics": [],
|
"topics": [],
|
||||||
|
"participants": [],
|
||||||
},
|
},
|
||||||
)
|
)
|
||||||
|
|
||||||
|
await self.update_participants_from_daily(transcript, track_keys)
|
||||||
|
|
||||||
source_storage = get_transcripts_storage()
|
source_storage = get_transcripts_storage()
|
||||||
transcript_storage = source_storage
|
transcript_storage = source_storage
|
||||||
|
|
||||||
|
|||||||
@@ -1,6 +1,7 @@
|
|||||||
import io
|
import io
|
||||||
import re
|
import re
|
||||||
import tempfile
|
import tempfile
|
||||||
|
from collections import defaultdict
|
||||||
from pathlib import Path
|
from pathlib import Path
|
||||||
from typing import Annotated, TypedDict
|
from typing import Annotated, TypedDict
|
||||||
|
|
||||||
@@ -16,6 +17,17 @@ class DiarizationSegment(TypedDict):
|
|||||||
|
|
||||||
|
|
||||||
PUNC_RE = re.compile(r"[.;:?!…]")
|
PUNC_RE = re.compile(r"[.;:?!…]")
|
||||||
|
SENTENCE_END_RE = re.compile(r"[.?!…]$")
|
||||||
|
|
||||||
|
# Max segment length for words_to_segments() - breaks on any punctuation (. ; : ? ! …)
|
||||||
|
# when segment exceeds this limit. Used for non-multitrack recordings.
|
||||||
|
MAX_SEGMENT_CHARS = 120
|
||||||
|
|
||||||
|
# Max segment length for words_to_segments_by_sentence() - only breaks on sentence-ending
|
||||||
|
# punctuation (. ? ! …) when segment exceeds this limit. Higher threshold allows complete
|
||||||
|
# sentences in multitrack recordings where speakers overlap.
|
||||||
|
# similar number to server/reflector/processors/transcript_liner.py
|
||||||
|
MAX_SENTENCE_SEGMENT_CHARS = 1000
|
||||||
|
|
||||||
|
|
||||||
class AudioFile(BaseModel):
|
class AudioFile(BaseModel):
|
||||||
@@ -76,7 +88,6 @@ def words_to_segments(words: list[Word]) -> list[TranscriptSegment]:
|
|||||||
# but separate if the speaker changes, or if the punctuation is a . , ; : ? !
|
# but separate if the speaker changes, or if the punctuation is a . , ; : ? !
|
||||||
segments = []
|
segments = []
|
||||||
current_segment = None
|
current_segment = None
|
||||||
MAX_SEGMENT_LENGTH = 120
|
|
||||||
|
|
||||||
for word in words:
|
for word in words:
|
||||||
if current_segment is None:
|
if current_segment is None:
|
||||||
@@ -106,7 +117,7 @@ def words_to_segments(words: list[Word]) -> list[TranscriptSegment]:
|
|||||||
current_segment.end = word.end
|
current_segment.end = word.end
|
||||||
|
|
||||||
have_punc = PUNC_RE.search(word.text)
|
have_punc = PUNC_RE.search(word.text)
|
||||||
if have_punc and (len(current_segment.text) > MAX_SEGMENT_LENGTH):
|
if have_punc and (len(current_segment.text) > MAX_SEGMENT_CHARS):
|
||||||
segments.append(current_segment)
|
segments.append(current_segment)
|
||||||
current_segment = None
|
current_segment = None
|
||||||
|
|
||||||
@@ -116,6 +127,70 @@ def words_to_segments(words: list[Word]) -> list[TranscriptSegment]:
|
|||||||
return segments
|
return segments
|
||||||
|
|
||||||
|
|
||||||
|
def words_to_segments_by_sentence(words: list[Word]) -> list[TranscriptSegment]:
|
||||||
|
"""Group words by speaker, then split into sentences.
|
||||||
|
|
||||||
|
For multitrack recordings where words from different speakers are interleaved
|
||||||
|
by timestamp, this function first groups all words by speaker, then creates
|
||||||
|
segments based on sentence boundaries within each speaker's words.
|
||||||
|
|
||||||
|
This produces cleaner output than words_to_segments() which breaks on every
|
||||||
|
speaker change, resulting in many tiny segments when speakers overlap.
|
||||||
|
"""
|
||||||
|
if not words:
|
||||||
|
return []
|
||||||
|
|
||||||
|
# Group words by speaker, preserving order within each speaker
|
||||||
|
by_speaker: dict[int, list[Word]] = defaultdict(list)
|
||||||
|
for w in words:
|
||||||
|
by_speaker[w.speaker].append(w)
|
||||||
|
|
||||||
|
segments: list[TranscriptSegment] = []
|
||||||
|
|
||||||
|
for speaker, speaker_words in by_speaker.items():
|
||||||
|
current_text = ""
|
||||||
|
current_start: float | None = None
|
||||||
|
current_end: float = 0.0
|
||||||
|
|
||||||
|
for word in speaker_words:
|
||||||
|
if current_start is None:
|
||||||
|
current_start = word.start
|
||||||
|
|
||||||
|
current_text += word.text
|
||||||
|
current_end = word.end
|
||||||
|
|
||||||
|
# Check for sentence end or max length
|
||||||
|
is_sentence_end = SENTENCE_END_RE.search(word.text.strip())
|
||||||
|
is_too_long = len(current_text) >= MAX_SENTENCE_SEGMENT_CHARS
|
||||||
|
|
||||||
|
if is_sentence_end or is_too_long:
|
||||||
|
segments.append(
|
||||||
|
TranscriptSegment(
|
||||||
|
text=current_text,
|
||||||
|
start=current_start,
|
||||||
|
end=current_end,
|
||||||
|
speaker=speaker,
|
||||||
|
)
|
||||||
|
)
|
||||||
|
current_text = ""
|
||||||
|
current_start = None
|
||||||
|
|
||||||
|
# Flush remaining words for this speaker
|
||||||
|
if current_text and current_start is not None:
|
||||||
|
segments.append(
|
||||||
|
TranscriptSegment(
|
||||||
|
text=current_text,
|
||||||
|
start=current_start,
|
||||||
|
end=current_end,
|
||||||
|
speaker=speaker,
|
||||||
|
)
|
||||||
|
)
|
||||||
|
|
||||||
|
# Sort segments by start time
|
||||||
|
segments.sort(key=lambda s: s.start)
|
||||||
|
return segments
|
||||||
|
|
||||||
|
|
||||||
class Transcript(BaseModel):
|
class Transcript(BaseModel):
|
||||||
translation: str | None = None
|
translation: str | None = None
|
||||||
words: list[Word] = []
|
words: list[Word] = []
|
||||||
@@ -154,7 +229,9 @@ class Transcript(BaseModel):
|
|||||||
word.start += offset
|
word.start += offset
|
||||||
word.end += offset
|
word.end += offset
|
||||||
|
|
||||||
def as_segments(self) -> list[TranscriptSegment]:
|
def as_segments(self, is_multitrack: bool = False) -> list[TranscriptSegment]:
|
||||||
|
if is_multitrack:
|
||||||
|
return words_to_segments_by_sentence(self.words)
|
||||||
return words_to_segments(self.words)
|
return words_to_segments(self.words)
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
17
server/reflector/schemas/transcript_formats.py
Normal file
17
server/reflector/schemas/transcript_formats.py
Normal file
@@ -0,0 +1,17 @@
|
|||||||
|
"""Schema definitions for transcript format types and segments."""
|
||||||
|
|
||||||
|
from typing import Literal
|
||||||
|
|
||||||
|
from pydantic import BaseModel
|
||||||
|
|
||||||
|
TranscriptFormat = Literal["text", "text-timestamped", "webvtt-named", "json"]
|
||||||
|
|
||||||
|
|
||||||
|
class TranscriptSegment(BaseModel):
|
||||||
|
"""A single transcript segment with speaker and timing information."""
|
||||||
|
|
||||||
|
speaker: int
|
||||||
|
speaker_name: str
|
||||||
|
text: str
|
||||||
|
start: float
|
||||||
|
end: float
|
||||||
168
server/reflector/services/transcript_process.py
Normal file
168
server/reflector/services/transcript_process.py
Normal file
@@ -0,0 +1,168 @@
|
|||||||
|
"""
|
||||||
|
Transcript processing service - shared logic for HTTP endpoints and Celery tasks.
|
||||||
|
|
||||||
|
This module provides result-based error handling that works in both contexts:
|
||||||
|
- HTTP endpoint: converts errors to HTTPException
|
||||||
|
- Celery task: converts errors to Exception
|
||||||
|
"""
|
||||||
|
|
||||||
|
from dataclasses import dataclass
|
||||||
|
from typing import Literal, Union, assert_never
|
||||||
|
|
||||||
|
import celery
|
||||||
|
from celery.result import AsyncResult
|
||||||
|
|
||||||
|
from reflector.db.recordings import recordings_controller
|
||||||
|
from reflector.db.transcripts import Transcript
|
||||||
|
from reflector.pipelines.main_file_pipeline import task_pipeline_file_process
|
||||||
|
from reflector.pipelines.main_multitrack_pipeline import (
|
||||||
|
task_pipeline_multitrack_process,
|
||||||
|
)
|
||||||
|
from reflector.utils.string import NonEmptyString
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class ProcessError:
|
||||||
|
detail: NonEmptyString
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class FileProcessingConfig:
|
||||||
|
transcript_id: NonEmptyString
|
||||||
|
mode: Literal["file"] = "file"
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class MultitrackProcessingConfig:
|
||||||
|
transcript_id: NonEmptyString
|
||||||
|
bucket_name: NonEmptyString
|
||||||
|
track_keys: list[str]
|
||||||
|
mode: Literal["multitrack"] = "multitrack"
|
||||||
|
|
||||||
|
|
||||||
|
ProcessingConfig = Union[FileProcessingConfig, MultitrackProcessingConfig]
|
||||||
|
PrepareResult = Union[ProcessingConfig, ProcessError]
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class ValidationOk:
|
||||||
|
# transcript currently doesnt always have recording_id
|
||||||
|
recording_id: NonEmptyString | None
|
||||||
|
transcript_id: NonEmptyString
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class ValidationLocked:
|
||||||
|
detail: NonEmptyString
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class ValidationNotReady:
|
||||||
|
detail: NonEmptyString
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class ValidationAlreadyScheduled:
|
||||||
|
detail: NonEmptyString
|
||||||
|
|
||||||
|
|
||||||
|
ValidationError = Union[
|
||||||
|
ValidationNotReady, ValidationLocked, ValidationAlreadyScheduled
|
||||||
|
]
|
||||||
|
ValidationResult = Union[ValidationOk, ValidationError]
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class DispatchOk:
|
||||||
|
status: Literal["ok"] = "ok"
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class DispatchAlreadyRunning:
|
||||||
|
status: Literal["already_running"] = "already_running"
|
||||||
|
|
||||||
|
|
||||||
|
DispatchResult = Union[
|
||||||
|
DispatchOk, DispatchAlreadyRunning, ProcessError, ValidationError
|
||||||
|
]
|
||||||
|
|
||||||
|
|
||||||
|
async def validate_transcript_for_processing(
|
||||||
|
transcript: Transcript,
|
||||||
|
) -> ValidationResult:
|
||||||
|
if transcript.locked:
|
||||||
|
return ValidationLocked(detail="Recording is locked")
|
||||||
|
|
||||||
|
if transcript.status == "idle":
|
||||||
|
return ValidationNotReady(detail="Recording is not ready for processing")
|
||||||
|
|
||||||
|
if task_is_scheduled_or_active(
|
||||||
|
"reflector.pipelines.main_file_pipeline.task_pipeline_file_process",
|
||||||
|
transcript_id=transcript.id,
|
||||||
|
) or task_is_scheduled_or_active(
|
||||||
|
"reflector.pipelines.main_multitrack_pipeline.task_pipeline_multitrack_process",
|
||||||
|
transcript_id=transcript.id,
|
||||||
|
):
|
||||||
|
return ValidationAlreadyScheduled(detail="already running")
|
||||||
|
|
||||||
|
return ValidationOk(
|
||||||
|
recording_id=transcript.recording_id, transcript_id=transcript.id
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
async def prepare_transcript_processing(validation: ValidationOk) -> PrepareResult:
|
||||||
|
"""
|
||||||
|
Determine processing mode from transcript/recording data.
|
||||||
|
"""
|
||||||
|
bucket_name: str | None = None
|
||||||
|
track_keys: list[str] | None = None
|
||||||
|
|
||||||
|
if validation.recording_id:
|
||||||
|
recording = await recordings_controller.get_by_id(validation.recording_id)
|
||||||
|
if recording:
|
||||||
|
bucket_name = recording.bucket_name
|
||||||
|
track_keys = recording.track_keys
|
||||||
|
|
||||||
|
if track_keys is not None and len(track_keys) == 0:
|
||||||
|
return ProcessError(
|
||||||
|
detail="No track keys found, must be either > 0 or None",
|
||||||
|
)
|
||||||
|
if track_keys is not None and not bucket_name:
|
||||||
|
return ProcessError(
|
||||||
|
detail="Bucket name must be specified",
|
||||||
|
)
|
||||||
|
|
||||||
|
if track_keys:
|
||||||
|
return MultitrackProcessingConfig(
|
||||||
|
bucket_name=bucket_name, # type: ignore (validated above)
|
||||||
|
track_keys=track_keys,
|
||||||
|
transcript_id=validation.transcript_id,
|
||||||
|
)
|
||||||
|
|
||||||
|
return FileProcessingConfig(
|
||||||
|
transcript_id=validation.transcript_id,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
def dispatch_transcript_processing(config: ProcessingConfig) -> AsyncResult:
|
||||||
|
if isinstance(config, MultitrackProcessingConfig):
|
||||||
|
return task_pipeline_multitrack_process.delay(
|
||||||
|
transcript_id=config.transcript_id,
|
||||||
|
bucket_name=config.bucket_name,
|
||||||
|
track_keys=config.track_keys,
|
||||||
|
)
|
||||||
|
elif isinstance(config, FileProcessingConfig):
|
||||||
|
return task_pipeline_file_process.delay(transcript_id=config.transcript_id)
|
||||||
|
else:
|
||||||
|
assert_never(config)
|
||||||
|
|
||||||
|
|
||||||
|
def task_is_scheduled_or_active(task_name: str, **kwargs):
|
||||||
|
inspect = celery.current_app.control.inspect()
|
||||||
|
|
||||||
|
for worker, tasks in (inspect.scheduled() | inspect.active()).items():
|
||||||
|
for task in tasks:
|
||||||
|
if task["name"] == task_name and task["kwargs"] == kwargs:
|
||||||
|
return True
|
||||||
|
|
||||||
|
return False
|
||||||
127
server/reflector/tools/process_transcript.py
Normal file
127
server/reflector/tools/process_transcript.py
Normal file
@@ -0,0 +1,127 @@
|
|||||||
|
"""
|
||||||
|
Process transcript by ID - auto-detects multitrack vs file pipeline.
|
||||||
|
|
||||||
|
Usage:
|
||||||
|
uv run -m reflector.tools.process_transcript <transcript_id>
|
||||||
|
|
||||||
|
# Or via docker:
|
||||||
|
docker compose exec server uv run -m reflector.tools.process_transcript <transcript_id>
|
||||||
|
"""
|
||||||
|
|
||||||
|
import argparse
|
||||||
|
import asyncio
|
||||||
|
import sys
|
||||||
|
import time
|
||||||
|
from typing import Callable
|
||||||
|
|
||||||
|
from celery.result import AsyncResult
|
||||||
|
|
||||||
|
from reflector.db.transcripts import Transcript, transcripts_controller
|
||||||
|
from reflector.services.transcript_process import (
|
||||||
|
FileProcessingConfig,
|
||||||
|
MultitrackProcessingConfig,
|
||||||
|
PrepareResult,
|
||||||
|
ProcessError,
|
||||||
|
ValidationError,
|
||||||
|
ValidationResult,
|
||||||
|
dispatch_transcript_processing,
|
||||||
|
prepare_transcript_processing,
|
||||||
|
validate_transcript_for_processing,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
async def process_transcript_inner(
|
||||||
|
transcript: Transcript,
|
||||||
|
on_validation: Callable[[ValidationResult], None],
|
||||||
|
on_preprocess: Callable[[PrepareResult], None],
|
||||||
|
) -> AsyncResult:
|
||||||
|
validation = await validate_transcript_for_processing(transcript)
|
||||||
|
on_validation(validation)
|
||||||
|
config = await prepare_transcript_processing(validation)
|
||||||
|
on_preprocess(config)
|
||||||
|
return dispatch_transcript_processing(config)
|
||||||
|
|
||||||
|
|
||||||
|
async def process_transcript(transcript_id: str, sync: bool = False) -> None:
|
||||||
|
"""
|
||||||
|
Process a transcript by ID, auto-detecting multitrack vs file pipeline.
|
||||||
|
|
||||||
|
Args:
|
||||||
|
transcript_id: The transcript UUID
|
||||||
|
sync: If True, wait for task completion. If False, dispatch and exit.
|
||||||
|
"""
|
||||||
|
from reflector.db import get_database
|
||||||
|
|
||||||
|
database = get_database()
|
||||||
|
await database.connect()
|
||||||
|
|
||||||
|
try:
|
||||||
|
transcript = await transcripts_controller.get_by_id(transcript_id)
|
||||||
|
if not transcript:
|
||||||
|
print(f"Error: Transcript {transcript_id} not found", file=sys.stderr)
|
||||||
|
sys.exit(1)
|
||||||
|
|
||||||
|
print(f"Found transcript: {transcript.title or transcript_id}", file=sys.stderr)
|
||||||
|
print(f" Status: {transcript.status}", file=sys.stderr)
|
||||||
|
print(f" Recording ID: {transcript.recording_id or 'None'}", file=sys.stderr)
|
||||||
|
|
||||||
|
def on_validation(validation: ValidationResult) -> None:
|
||||||
|
if isinstance(validation, ValidationError):
|
||||||
|
print(f"Error: {validation.detail}", file=sys.stderr)
|
||||||
|
sys.exit(1)
|
||||||
|
|
||||||
|
def on_preprocess(config: PrepareResult) -> None:
|
||||||
|
if isinstance(config, ProcessError):
|
||||||
|
print(f"Error: {config.detail}", file=sys.stderr)
|
||||||
|
sys.exit(1)
|
||||||
|
elif isinstance(config, MultitrackProcessingConfig):
|
||||||
|
print(f"Dispatching multitrack pipeline", file=sys.stderr)
|
||||||
|
print(f" Bucket: {config.bucket_name}", file=sys.stderr)
|
||||||
|
print(f" Tracks: {len(config.track_keys)}", file=sys.stderr)
|
||||||
|
elif isinstance(config, FileProcessingConfig):
|
||||||
|
print(f"Dispatching file pipeline", file=sys.stderr)
|
||||||
|
|
||||||
|
result = await process_transcript_inner(
|
||||||
|
transcript, on_validation=on_validation, on_preprocess=on_preprocess
|
||||||
|
)
|
||||||
|
|
||||||
|
if sync:
|
||||||
|
print("Waiting for task completion...", file=sys.stderr)
|
||||||
|
while not result.ready():
|
||||||
|
print(f" Status: {result.state}", file=sys.stderr)
|
||||||
|
time.sleep(5)
|
||||||
|
|
||||||
|
if result.successful():
|
||||||
|
print("Task completed successfully", file=sys.stderr)
|
||||||
|
else:
|
||||||
|
print(f"Task failed: {result.result}", file=sys.stderr)
|
||||||
|
sys.exit(1)
|
||||||
|
else:
|
||||||
|
print(
|
||||||
|
"Task dispatched (use --sync to wait for completion)", file=sys.stderr
|
||||||
|
)
|
||||||
|
|
||||||
|
finally:
|
||||||
|
await database.disconnect()
|
||||||
|
|
||||||
|
|
||||||
|
def main():
|
||||||
|
parser = argparse.ArgumentParser(
|
||||||
|
description="Process transcript by ID - auto-detects multitrack vs file pipeline"
|
||||||
|
)
|
||||||
|
parser.add_argument(
|
||||||
|
"transcript_id",
|
||||||
|
help="Transcript UUID to process",
|
||||||
|
)
|
||||||
|
parser.add_argument(
|
||||||
|
"--sync",
|
||||||
|
action="store_true",
|
||||||
|
help="Wait for task completion instead of just dispatching",
|
||||||
|
)
|
||||||
|
|
||||||
|
args = parser.parse_args()
|
||||||
|
asyncio.run(process_transcript(args.transcript_id, sync=args.sync))
|
||||||
|
|
||||||
|
|
||||||
|
if __name__ == "__main__":
|
||||||
|
main()
|
||||||
@@ -64,6 +64,11 @@ def recording_lock_key(recording_id: NonEmptyString) -> NonEmptyString:
|
|||||||
return f"recording:{recording_id}"
|
return f"recording:{recording_id}"
|
||||||
|
|
||||||
|
|
||||||
|
def filter_cam_audio_tracks(track_keys: list[str]) -> list[str]:
|
||||||
|
"""Filter track keys to cam-audio tracks only (skip screen-audio, etc.)."""
|
||||||
|
return [k for k in track_keys if "cam-audio" in k]
|
||||||
|
|
||||||
|
|
||||||
def extract_base_room_name(daily_room_name: DailyRoomName) -> NonEmptyString:
|
def extract_base_room_name(daily_room_name: DailyRoomName) -> NonEmptyString:
|
||||||
"""
|
"""
|
||||||
Extract base room name from Daily.co timestamped room name.
|
Extract base room name from Daily.co timestamped room name.
|
||||||
|
|||||||
133
server/reflector/utils/transcript_formats.py
Normal file
133
server/reflector/utils/transcript_formats.py
Normal file
@@ -0,0 +1,133 @@
|
|||||||
|
"""Utilities for converting transcript data to various output formats."""
|
||||||
|
|
||||||
|
import webvtt
|
||||||
|
|
||||||
|
from reflector.db.transcripts import TranscriptParticipant, TranscriptTopic
|
||||||
|
from reflector.processors.types import (
|
||||||
|
Transcript as ProcessorTranscript,
|
||||||
|
)
|
||||||
|
from reflector.schemas.transcript_formats import TranscriptSegment
|
||||||
|
from reflector.utils.webvtt import seconds_to_timestamp
|
||||||
|
|
||||||
|
|
||||||
|
def get_speaker_name(
|
||||||
|
speaker: int, participants: list[TranscriptParticipant] | None
|
||||||
|
) -> str:
|
||||||
|
"""Get participant name for speaker or default to 'Speaker N'."""
|
||||||
|
if participants:
|
||||||
|
for participant in participants:
|
||||||
|
if participant.speaker == speaker:
|
||||||
|
return participant.name
|
||||||
|
return f"Speaker {speaker}"
|
||||||
|
|
||||||
|
|
||||||
|
def format_timestamp_mmss(seconds: float | int) -> str:
|
||||||
|
"""Format seconds as MM:SS timestamp."""
|
||||||
|
minutes = int(seconds // 60)
|
||||||
|
secs = int(seconds % 60)
|
||||||
|
return f"{minutes:02d}:{secs:02d}"
|
||||||
|
|
||||||
|
|
||||||
|
def transcript_to_text(
|
||||||
|
topics: list[TranscriptTopic],
|
||||||
|
participants: list[TranscriptParticipant] | None,
|
||||||
|
is_multitrack: bool = False,
|
||||||
|
) -> str:
|
||||||
|
"""Convert transcript topics to plain text with speaker names."""
|
||||||
|
lines = []
|
||||||
|
for topic in topics:
|
||||||
|
if not topic.words:
|
||||||
|
continue
|
||||||
|
|
||||||
|
transcript = ProcessorTranscript(words=topic.words)
|
||||||
|
segments = transcript.as_segments(is_multitrack)
|
||||||
|
|
||||||
|
for segment in segments:
|
||||||
|
speaker_name = get_speaker_name(segment.speaker, participants)
|
||||||
|
text = segment.text.strip()
|
||||||
|
lines.append(f"{speaker_name}: {text}")
|
||||||
|
|
||||||
|
return "\n".join(lines)
|
||||||
|
|
||||||
|
|
||||||
|
def transcript_to_text_timestamped(
|
||||||
|
topics: list[TranscriptTopic],
|
||||||
|
participants: list[TranscriptParticipant] | None,
|
||||||
|
is_multitrack: bool = False,
|
||||||
|
) -> str:
|
||||||
|
"""Convert transcript topics to timestamped text with speaker names."""
|
||||||
|
lines = []
|
||||||
|
for topic in topics:
|
||||||
|
if not topic.words:
|
||||||
|
continue
|
||||||
|
|
||||||
|
transcript = ProcessorTranscript(words=topic.words)
|
||||||
|
segments = transcript.as_segments(is_multitrack)
|
||||||
|
|
||||||
|
for segment in segments:
|
||||||
|
speaker_name = get_speaker_name(segment.speaker, participants)
|
||||||
|
timestamp = format_timestamp_mmss(segment.start)
|
||||||
|
text = segment.text.strip()
|
||||||
|
lines.append(f"[{timestamp}] {speaker_name}: {text}")
|
||||||
|
|
||||||
|
return "\n".join(lines)
|
||||||
|
|
||||||
|
|
||||||
|
def topics_to_webvtt_named(
|
||||||
|
topics: list[TranscriptTopic],
|
||||||
|
participants: list[TranscriptParticipant] | None,
|
||||||
|
is_multitrack: bool = False,
|
||||||
|
) -> str:
|
||||||
|
"""Convert transcript topics to WebVTT format with participant names."""
|
||||||
|
vtt = webvtt.WebVTT()
|
||||||
|
|
||||||
|
for topic in topics:
|
||||||
|
if not topic.words:
|
||||||
|
continue
|
||||||
|
|
||||||
|
transcript = ProcessorTranscript(words=topic.words)
|
||||||
|
segments = transcript.as_segments(is_multitrack)
|
||||||
|
|
||||||
|
for segment in segments:
|
||||||
|
speaker_name = get_speaker_name(segment.speaker, participants)
|
||||||
|
text = segment.text.strip()
|
||||||
|
text = f"<v {speaker_name}>{text}"
|
||||||
|
|
||||||
|
caption = webvtt.Caption(
|
||||||
|
start=seconds_to_timestamp(segment.start),
|
||||||
|
end=seconds_to_timestamp(segment.end),
|
||||||
|
text=text,
|
||||||
|
)
|
||||||
|
vtt.captions.append(caption)
|
||||||
|
|
||||||
|
return vtt.content
|
||||||
|
|
||||||
|
|
||||||
|
def transcript_to_json_segments(
|
||||||
|
topics: list[TranscriptTopic],
|
||||||
|
participants: list[TranscriptParticipant] | None,
|
||||||
|
is_multitrack: bool = False,
|
||||||
|
) -> list[TranscriptSegment]:
|
||||||
|
"""Convert transcript topics to a flat list of JSON segments."""
|
||||||
|
result = []
|
||||||
|
|
||||||
|
for topic in topics:
|
||||||
|
if not topic.words:
|
||||||
|
continue
|
||||||
|
|
||||||
|
transcript = ProcessorTranscript(words=topic.words)
|
||||||
|
segments = transcript.as_segments(is_multitrack)
|
||||||
|
|
||||||
|
for segment in segments:
|
||||||
|
speaker_name = get_speaker_name(segment.speaker, participants)
|
||||||
|
result.append(
|
||||||
|
TranscriptSegment(
|
||||||
|
speaker=segment.speaker,
|
||||||
|
speaker_name=speaker_name,
|
||||||
|
text=segment.text.strip(),
|
||||||
|
start=segment.start,
|
||||||
|
end=segment.end,
|
||||||
|
)
|
||||||
|
)
|
||||||
|
|
||||||
|
return result
|
||||||
@@ -13,7 +13,7 @@ VttTimestamp = Annotated[str, "vtt_timestamp"]
|
|||||||
WebVTTStr = Annotated[str, "webvtt_str"]
|
WebVTTStr = Annotated[str, "webvtt_str"]
|
||||||
|
|
||||||
|
|
||||||
def _seconds_to_timestamp(seconds: Seconds) -> VttTimestamp:
|
def seconds_to_timestamp(seconds: Seconds) -> VttTimestamp:
|
||||||
# lib doesn't do that
|
# lib doesn't do that
|
||||||
hours = int(seconds // 3600)
|
hours = int(seconds // 3600)
|
||||||
minutes = int((seconds % 3600) // 60)
|
minutes = int((seconds % 3600) // 60)
|
||||||
@@ -37,8 +37,8 @@ def words_to_webvtt(words: list[Word]) -> WebVTTStr:
|
|||||||
text = f"<v Speaker{segment.speaker}>{text}"
|
text = f"<v Speaker{segment.speaker}>{text}"
|
||||||
|
|
||||||
caption = webvtt.Caption(
|
caption = webvtt.Caption(
|
||||||
start=_seconds_to_timestamp(segment.start),
|
start=seconds_to_timestamp(segment.start),
|
||||||
end=_seconds_to_timestamp(segment.end),
|
end=seconds_to_timestamp(segment.end),
|
||||||
text=text,
|
text=text,
|
||||||
)
|
)
|
||||||
vtt.captions.append(caption)
|
vtt.captions.append(caption)
|
||||||
|
|||||||
@@ -31,6 +31,7 @@ class DailyClient(VideoPlatformClient):
|
|||||||
PLATFORM_NAME: Platform = "daily"
|
PLATFORM_NAME: Platform = "daily"
|
||||||
TIMESTAMP_FORMAT = "%Y%m%d%H%M%S"
|
TIMESTAMP_FORMAT = "%Y%m%d%H%M%S"
|
||||||
RECORDING_NONE: RecordingType = "none"
|
RECORDING_NONE: RecordingType = "none"
|
||||||
|
RECORDING_LOCAL: RecordingType = "local"
|
||||||
RECORDING_CLOUD: RecordingType = "cloud"
|
RECORDING_CLOUD: RecordingType = "cloud"
|
||||||
|
|
||||||
def __init__(self, config: VideoPlatformConfig):
|
def __init__(self, config: VideoPlatformConfig):
|
||||||
@@ -54,19 +55,23 @@ class DailyClient(VideoPlatformClient):
|
|||||||
timestamp = datetime.now().strftime(self.TIMESTAMP_FORMAT)
|
timestamp = datetime.now().strftime(self.TIMESTAMP_FORMAT)
|
||||||
room_name = f"{room_name_prefix}{ROOM_PREFIX_SEPARATOR}{timestamp}"
|
room_name = f"{room_name_prefix}{ROOM_PREFIX_SEPARATOR}{timestamp}"
|
||||||
|
|
||||||
|
enable_recording = None
|
||||||
|
if room.recording_type == self.RECORDING_LOCAL:
|
||||||
|
enable_recording = "local"
|
||||||
|
elif room.recording_type == self.RECORDING_CLOUD:
|
||||||
|
enable_recording = "raw-tracks"
|
||||||
|
|
||||||
properties = RoomProperties(
|
properties = RoomProperties(
|
||||||
enable_recording="raw-tracks"
|
enable_recording=enable_recording,
|
||||||
if room.recording_type != self.RECORDING_NONE
|
|
||||||
else False,
|
|
||||||
enable_chat=True,
|
enable_chat=True,
|
||||||
enable_screenshare=True,
|
enable_screenshare=True,
|
||||||
|
enable_knocking=room.is_locked,
|
||||||
start_video_off=False,
|
start_video_off=False,
|
||||||
start_audio_off=False,
|
start_audio_off=False,
|
||||||
exp=int(end_date.timestamp()),
|
exp=int(end_date.timestamp()),
|
||||||
)
|
)
|
||||||
|
|
||||||
# Only configure recordings_bucket if recording is enabled
|
if room.recording_type == self.RECORDING_CLOUD:
|
||||||
if room.recording_type != self.RECORDING_NONE:
|
|
||||||
daily_storage = get_dailyco_storage()
|
daily_storage = get_dailyco_storage()
|
||||||
assert daily_storage.bucket_name, "S3 bucket must be configured"
|
assert daily_storage.bucket_name, "S3 bucket must be configured"
|
||||||
properties.recordings_bucket = RecordingsBucketConfig(
|
properties.recordings_bucket = RecordingsBucketConfig(
|
||||||
@@ -172,16 +177,18 @@ class DailyClient(VideoPlatformClient):
|
|||||||
async def create_meeting_token(
|
async def create_meeting_token(
|
||||||
self,
|
self,
|
||||||
room_name: DailyRoomName,
|
room_name: DailyRoomName,
|
||||||
enable_recording: bool,
|
start_cloud_recording: bool,
|
||||||
user_id: str | None = None,
|
enable_recording_ui: bool,
|
||||||
) -> str:
|
user_id: NonEmptyString | None = None,
|
||||||
|
is_owner: bool = False,
|
||||||
|
) -> NonEmptyString:
|
||||||
properties = MeetingTokenProperties(
|
properties = MeetingTokenProperties(
|
||||||
room_name=room_name,
|
room_name=room_name,
|
||||||
user_id=user_id,
|
user_id=user_id,
|
||||||
start_cloud_recording=enable_recording,
|
start_cloud_recording=start_cloud_recording,
|
||||||
enable_recording_ui=not enable_recording,
|
enable_recording_ui=enable_recording_ui,
|
||||||
|
is_owner=is_owner,
|
||||||
)
|
)
|
||||||
|
|
||||||
request = CreateMeetingTokenRequest(properties=properties)
|
request = CreateMeetingTokenRequest(properties=properties)
|
||||||
result = await self._api_client.create_meeting_token(request)
|
result = await self._api_client.create_meeting_token(request)
|
||||||
return result.token
|
return result.token
|
||||||
|
|||||||
@@ -89,7 +89,7 @@ class CreateRoom(BaseModel):
|
|||||||
ics_url: Optional[str] = None
|
ics_url: Optional[str] = None
|
||||||
ics_fetch_interval: int = 300
|
ics_fetch_interval: int = 300
|
||||||
ics_enabled: bool = False
|
ics_enabled: bool = False
|
||||||
platform: Optional[Platform] = None
|
platform: Platform
|
||||||
|
|
||||||
|
|
||||||
class UpdateRoom(BaseModel):
|
class UpdateRoom(BaseModel):
|
||||||
@@ -310,6 +310,22 @@ async def rooms_create_meeting(
|
|||||||
room=room, current_time=current_time
|
room=room, current_time=current_time
|
||||||
)
|
)
|
||||||
|
|
||||||
|
if meeting is not None:
|
||||||
|
settings_match = (
|
||||||
|
meeting.is_locked == room.is_locked
|
||||||
|
and meeting.room_mode == room.room_mode
|
||||||
|
and meeting.recording_type == room.recording_type
|
||||||
|
and meeting.recording_trigger == room.recording_trigger
|
||||||
|
and meeting.platform == room.platform
|
||||||
|
)
|
||||||
|
if not settings_match:
|
||||||
|
logger.info(
|
||||||
|
f"Room settings changed for {room_name}, creating new meeting",
|
||||||
|
room_id=room.id,
|
||||||
|
old_meeting_id=meeting.id,
|
||||||
|
)
|
||||||
|
meeting = None
|
||||||
|
|
||||||
if meeting is None:
|
if meeting is None:
|
||||||
end_date = current_time + timedelta(hours=8)
|
end_date = current_time + timedelta(hours=8)
|
||||||
|
|
||||||
@@ -337,19 +353,7 @@ async def rooms_create_meeting(
|
|||||||
status_code=503, detail="Meeting creation in progress, please try again"
|
status_code=503, detail="Meeting creation in progress, please try again"
|
||||||
)
|
)
|
||||||
|
|
||||||
if meeting.platform == "daily" and room.recording_trigger != "none":
|
if user_id != room.user_id and meeting.platform == "whereby":
|
||||||
client = create_platform_client(meeting.platform)
|
|
||||||
token = await client.create_meeting_token(
|
|
||||||
meeting.room_name,
|
|
||||||
enable_recording=True,
|
|
||||||
user_id=user_id,
|
|
||||||
)
|
|
||||||
meeting = meeting.model_copy()
|
|
||||||
meeting.room_url = add_query_param(meeting.room_url, "t", token)
|
|
||||||
if meeting.host_room_url:
|
|
||||||
meeting.host_room_url = add_query_param(meeting.host_room_url, "t", token)
|
|
||||||
|
|
||||||
if user_id != room.user_id:
|
|
||||||
meeting.host_room_url = ""
|
meeting.host_room_url = ""
|
||||||
|
|
||||||
return meeting
|
return meeting
|
||||||
@@ -508,7 +512,8 @@ async def rooms_list_active_meetings(
|
|||||||
|
|
||||||
if user_id != room.user_id:
|
if user_id != room.user_id:
|
||||||
for meeting in meetings:
|
for meeting in meetings:
|
||||||
meeting.host_room_url = ""
|
if meeting.platform == "whereby":
|
||||||
|
meeting.host_room_url = ""
|
||||||
|
|
||||||
return meetings
|
return meetings
|
||||||
|
|
||||||
@@ -530,7 +535,7 @@ async def rooms_get_meeting(
|
|||||||
if not meeting:
|
if not meeting:
|
||||||
raise HTTPException(status_code=404, detail="Meeting not found")
|
raise HTTPException(status_code=404, detail="Meeting not found")
|
||||||
|
|
||||||
if user_id != room.user_id and not room.is_shared:
|
if user_id != room.user_id and not room.is_shared and meeting.platform == "whereby":
|
||||||
meeting.host_room_url = ""
|
meeting.host_room_url = ""
|
||||||
|
|
||||||
return meeting
|
return meeting
|
||||||
@@ -560,7 +565,16 @@ async def rooms_join_meeting(
|
|||||||
if meeting.end_date <= current_time:
|
if meeting.end_date <= current_time:
|
||||||
raise HTTPException(status_code=400, detail="Meeting has ended")
|
raise HTTPException(status_code=400, detail="Meeting has ended")
|
||||||
|
|
||||||
if user_id != room.user_id:
|
if meeting.platform == "daily" and user_id is not None:
|
||||||
meeting.host_room_url = ""
|
client = create_platform_client(meeting.platform)
|
||||||
|
token = await client.create_meeting_token(
|
||||||
|
meeting.room_name,
|
||||||
|
start_cloud_recording=meeting.recording_type == "cloud",
|
||||||
|
enable_recording_ui=meeting.recording_type == "local",
|
||||||
|
user_id=user_id,
|
||||||
|
is_owner=user_id == room.user_id,
|
||||||
|
)
|
||||||
|
meeting = meeting.model_copy()
|
||||||
|
meeting.room_url = add_query_param(meeting.room_url, "t", token)
|
||||||
|
|
||||||
return meeting
|
return meeting
|
||||||
|
|||||||
@@ -1,14 +1,22 @@
|
|||||||
from datetime import datetime, timedelta, timezone
|
from datetime import datetime, timedelta, timezone
|
||||||
from typing import Annotated, Literal, Optional
|
from typing import Annotated, Literal, Optional, assert_never
|
||||||
|
|
||||||
from fastapi import APIRouter, Depends, HTTPException, Query
|
from fastapi import APIRouter, Depends, HTTPException, Query
|
||||||
from fastapi_pagination import Page
|
from fastapi_pagination import Page
|
||||||
from fastapi_pagination.ext.databases import apaginate
|
from fastapi_pagination.ext.databases import apaginate
|
||||||
from jose import jwt
|
from jose import jwt
|
||||||
from pydantic import AwareDatetime, BaseModel, Field, constr, field_serializer
|
from pydantic import (
|
||||||
|
AwareDatetime,
|
||||||
|
BaseModel,
|
||||||
|
Discriminator,
|
||||||
|
Field,
|
||||||
|
constr,
|
||||||
|
field_serializer,
|
||||||
|
)
|
||||||
|
|
||||||
import reflector.auth as auth
|
import reflector.auth as auth
|
||||||
from reflector.db import get_database
|
from reflector.db import get_database
|
||||||
|
from reflector.db.recordings import recordings_controller
|
||||||
from reflector.db.search import (
|
from reflector.db.search import (
|
||||||
DEFAULT_SEARCH_LIMIT,
|
DEFAULT_SEARCH_LIMIT,
|
||||||
SearchLimit,
|
SearchLimit,
|
||||||
@@ -31,7 +39,14 @@ from reflector.db.transcripts import (
|
|||||||
)
|
)
|
||||||
from reflector.processors.types import Transcript as ProcessorTranscript
|
from reflector.processors.types import Transcript as ProcessorTranscript
|
||||||
from reflector.processors.types import Word
|
from reflector.processors.types import Word
|
||||||
|
from reflector.schemas.transcript_formats import TranscriptFormat, TranscriptSegment
|
||||||
from reflector.settings import settings
|
from reflector.settings import settings
|
||||||
|
from reflector.utils.transcript_formats import (
|
||||||
|
topics_to_webvtt_named,
|
||||||
|
transcript_to_json_segments,
|
||||||
|
transcript_to_text,
|
||||||
|
transcript_to_text_timestamped,
|
||||||
|
)
|
||||||
from reflector.ws_manager import get_ws_manager
|
from reflector.ws_manager import get_ws_manager
|
||||||
from reflector.zulip import (
|
from reflector.zulip import (
|
||||||
InvalidMessageError,
|
InvalidMessageError,
|
||||||
@@ -46,6 +61,14 @@ ALGORITHM = "HS256"
|
|||||||
DOWNLOAD_EXPIRE_MINUTES = 60
|
DOWNLOAD_EXPIRE_MINUTES = 60
|
||||||
|
|
||||||
|
|
||||||
|
async def _get_is_multitrack(transcript) -> bool:
|
||||||
|
"""Detect if transcript is from multitrack recording."""
|
||||||
|
if not transcript.recording_id:
|
||||||
|
return False
|
||||||
|
recording = await recordings_controller.get_by_id(transcript.recording_id)
|
||||||
|
return recording is not None and recording.is_multitrack
|
||||||
|
|
||||||
|
|
||||||
def create_access_token(data: dict, expires_delta: timedelta):
|
def create_access_token(data: dict, expires_delta: timedelta):
|
||||||
to_encode = data.copy()
|
to_encode = data.copy()
|
||||||
expire = datetime.now(timezone.utc) + expires_delta
|
expire = datetime.now(timezone.utc) + expires_delta
|
||||||
@@ -88,10 +111,84 @@ class GetTranscriptMinimal(BaseModel):
|
|||||||
audio_deleted: bool | None = None
|
audio_deleted: bool | None = None
|
||||||
|
|
||||||
|
|
||||||
class GetTranscript(GetTranscriptMinimal):
|
class GetTranscriptWithParticipants(GetTranscriptMinimal):
|
||||||
participants: list[TranscriptParticipant] | None
|
participants: list[TranscriptParticipant] | None
|
||||||
|
|
||||||
|
|
||||||
|
class GetTranscriptWithText(GetTranscriptWithParticipants):
|
||||||
|
"""
|
||||||
|
Transcript response with plain text format.
|
||||||
|
|
||||||
|
Format: Speaker names followed by their dialogue, one line per segment.
|
||||||
|
Example:
|
||||||
|
John Smith: Hello everyone
|
||||||
|
Jane Doe: Hi there
|
||||||
|
"""
|
||||||
|
|
||||||
|
transcript_format: Literal["text"] = "text"
|
||||||
|
transcript: str
|
||||||
|
|
||||||
|
|
||||||
|
class GetTranscriptWithTextTimestamped(GetTranscriptWithParticipants):
|
||||||
|
"""
|
||||||
|
Transcript response with timestamped text format.
|
||||||
|
|
||||||
|
Format: [MM:SS] timestamp prefix before each speaker and dialogue.
|
||||||
|
Example:
|
||||||
|
[00:00] John Smith: Hello everyone
|
||||||
|
[00:05] Jane Doe: Hi there
|
||||||
|
"""
|
||||||
|
|
||||||
|
transcript_format: Literal["text-timestamped"] = "text-timestamped"
|
||||||
|
transcript: str
|
||||||
|
|
||||||
|
|
||||||
|
class GetTranscriptWithWebVTTNamed(GetTranscriptWithParticipants):
|
||||||
|
"""
|
||||||
|
Transcript response in WebVTT subtitle format with participant names.
|
||||||
|
|
||||||
|
Format: Standard WebVTT with voice tags using participant names.
|
||||||
|
Example:
|
||||||
|
WEBVTT
|
||||||
|
|
||||||
|
00:00:00.000 --> 00:00:05.000
|
||||||
|
<v John Smith>Hello everyone
|
||||||
|
"""
|
||||||
|
|
||||||
|
transcript_format: Literal["webvtt-named"] = "webvtt-named"
|
||||||
|
transcript: str
|
||||||
|
|
||||||
|
|
||||||
|
class GetTranscriptWithJSON(GetTranscriptWithParticipants):
|
||||||
|
"""
|
||||||
|
Transcript response as structured JSON segments.
|
||||||
|
|
||||||
|
Format: Array of segment objects with speaker info, text, and timing.
|
||||||
|
Example:
|
||||||
|
[
|
||||||
|
{
|
||||||
|
"speaker": 0,
|
||||||
|
"speaker_name": "John Smith",
|
||||||
|
"text": "Hello everyone",
|
||||||
|
"start": 0.0,
|
||||||
|
"end": 5.0
|
||||||
|
}
|
||||||
|
]
|
||||||
|
"""
|
||||||
|
|
||||||
|
transcript_format: Literal["json"] = "json"
|
||||||
|
transcript: list[TranscriptSegment]
|
||||||
|
|
||||||
|
|
||||||
|
GetTranscript = Annotated[
|
||||||
|
GetTranscriptWithText
|
||||||
|
| GetTranscriptWithTextTimestamped
|
||||||
|
| GetTranscriptWithWebVTTNamed
|
||||||
|
| GetTranscriptWithJSON,
|
||||||
|
Discriminator("transcript_format"),
|
||||||
|
]
|
||||||
|
|
||||||
|
|
||||||
class CreateTranscript(BaseModel):
|
class CreateTranscript(BaseModel):
|
||||||
name: str
|
name: str
|
||||||
source_language: str = Field("en")
|
source_language: str = Field("en")
|
||||||
@@ -228,7 +325,7 @@ async def transcripts_search(
|
|||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
@router.post("/transcripts", response_model=GetTranscript)
|
@router.post("/transcripts", response_model=GetTranscriptWithParticipants)
|
||||||
async def transcripts_create(
|
async def transcripts_create(
|
||||||
info: CreateTranscript,
|
info: CreateTranscript,
|
||||||
user: Annotated[Optional[auth.UserInfo], Depends(auth.current_user_optional)],
|
user: Annotated[Optional[auth.UserInfo], Depends(auth.current_user_optional)],
|
||||||
@@ -272,7 +369,7 @@ class GetTranscriptTopic(BaseModel):
|
|||||||
segments: list[GetTranscriptSegmentTopic] = []
|
segments: list[GetTranscriptSegmentTopic] = []
|
||||||
|
|
||||||
@classmethod
|
@classmethod
|
||||||
def from_transcript_topic(cls, topic: TranscriptTopic):
|
def from_transcript_topic(cls, topic: TranscriptTopic, is_multitrack: bool = False):
|
||||||
if not topic.words:
|
if not topic.words:
|
||||||
# In previous version, words were missing
|
# In previous version, words were missing
|
||||||
# Just output a segment with speaker 0
|
# Just output a segment with speaker 0
|
||||||
@@ -296,7 +393,7 @@ class GetTranscriptTopic(BaseModel):
|
|||||||
start=segment.start,
|
start=segment.start,
|
||||||
speaker=segment.speaker,
|
speaker=segment.speaker,
|
||||||
)
|
)
|
||||||
for segment in transcript.as_segments()
|
for segment in transcript.as_segments(is_multitrack)
|
||||||
]
|
]
|
||||||
return cls(
|
return cls(
|
||||||
id=topic.id,
|
id=topic.id,
|
||||||
@@ -313,8 +410,8 @@ class GetTranscriptTopicWithWords(GetTranscriptTopic):
|
|||||||
words: list[Word] = []
|
words: list[Word] = []
|
||||||
|
|
||||||
@classmethod
|
@classmethod
|
||||||
def from_transcript_topic(cls, topic: TranscriptTopic):
|
def from_transcript_topic(cls, topic: TranscriptTopic, is_multitrack: bool = False):
|
||||||
instance = super().from_transcript_topic(topic)
|
instance = super().from_transcript_topic(topic, is_multitrack)
|
||||||
if topic.words:
|
if topic.words:
|
||||||
instance.words = topic.words
|
instance.words = topic.words
|
||||||
return instance
|
return instance
|
||||||
@@ -329,8 +426,8 @@ class GetTranscriptTopicWithWordsPerSpeaker(GetTranscriptTopic):
|
|||||||
words_per_speaker: list[SpeakerWords] = []
|
words_per_speaker: list[SpeakerWords] = []
|
||||||
|
|
||||||
@classmethod
|
@classmethod
|
||||||
def from_transcript_topic(cls, topic: TranscriptTopic):
|
def from_transcript_topic(cls, topic: TranscriptTopic, is_multitrack: bool = False):
|
||||||
instance = super().from_transcript_topic(topic)
|
instance = super().from_transcript_topic(topic, is_multitrack)
|
||||||
if topic.words:
|
if topic.words:
|
||||||
words_per_speakers = []
|
words_per_speakers = []
|
||||||
# group words by speaker
|
# group words by speaker
|
||||||
@@ -362,14 +459,76 @@ class GetTranscriptTopicWithWordsPerSpeaker(GetTranscriptTopic):
|
|||||||
async def transcript_get(
|
async def transcript_get(
|
||||||
transcript_id: str,
|
transcript_id: str,
|
||||||
user: Annotated[Optional[auth.UserInfo], Depends(auth.current_user_optional)],
|
user: Annotated[Optional[auth.UserInfo], Depends(auth.current_user_optional)],
|
||||||
|
transcript_format: TranscriptFormat = "text",
|
||||||
):
|
):
|
||||||
user_id = user["sub"] if user else None
|
user_id = user["sub"] if user else None
|
||||||
return await transcripts_controller.get_by_id_for_http(
|
transcript = await transcripts_controller.get_by_id_for_http(
|
||||||
transcript_id, user_id=user_id
|
transcript_id, user_id=user_id
|
||||||
)
|
)
|
||||||
|
|
||||||
|
is_multitrack = await _get_is_multitrack(transcript)
|
||||||
|
|
||||||
@router.patch("/transcripts/{transcript_id}", response_model=GetTranscript)
|
base_data = {
|
||||||
|
"id": transcript.id,
|
||||||
|
"user_id": transcript.user_id,
|
||||||
|
"name": transcript.name,
|
||||||
|
"status": transcript.status,
|
||||||
|
"locked": transcript.locked,
|
||||||
|
"duration": transcript.duration,
|
||||||
|
"title": transcript.title,
|
||||||
|
"short_summary": transcript.short_summary,
|
||||||
|
"long_summary": transcript.long_summary,
|
||||||
|
"created_at": transcript.created_at,
|
||||||
|
"share_mode": transcript.share_mode,
|
||||||
|
"source_language": transcript.source_language,
|
||||||
|
"target_language": transcript.target_language,
|
||||||
|
"reviewed": transcript.reviewed,
|
||||||
|
"meeting_id": transcript.meeting_id,
|
||||||
|
"source_kind": transcript.source_kind,
|
||||||
|
"room_id": transcript.room_id,
|
||||||
|
"audio_deleted": transcript.audio_deleted,
|
||||||
|
"participants": transcript.participants,
|
||||||
|
}
|
||||||
|
|
||||||
|
if transcript_format == "text":
|
||||||
|
return GetTranscriptWithText(
|
||||||
|
**base_data,
|
||||||
|
transcript_format="text",
|
||||||
|
transcript=transcript_to_text(
|
||||||
|
transcript.topics, transcript.participants, is_multitrack
|
||||||
|
),
|
||||||
|
)
|
||||||
|
elif transcript_format == "text-timestamped":
|
||||||
|
return GetTranscriptWithTextTimestamped(
|
||||||
|
**base_data,
|
||||||
|
transcript_format="text-timestamped",
|
||||||
|
transcript=transcript_to_text_timestamped(
|
||||||
|
transcript.topics, transcript.participants, is_multitrack
|
||||||
|
),
|
||||||
|
)
|
||||||
|
elif transcript_format == "webvtt-named":
|
||||||
|
return GetTranscriptWithWebVTTNamed(
|
||||||
|
**base_data,
|
||||||
|
transcript_format="webvtt-named",
|
||||||
|
transcript=topics_to_webvtt_named(
|
||||||
|
transcript.topics, transcript.participants, is_multitrack
|
||||||
|
),
|
||||||
|
)
|
||||||
|
elif transcript_format == "json":
|
||||||
|
return GetTranscriptWithJSON(
|
||||||
|
**base_data,
|
||||||
|
transcript_format="json",
|
||||||
|
transcript=transcript_to_json_segments(
|
||||||
|
transcript.topics, transcript.participants, is_multitrack
|
||||||
|
),
|
||||||
|
)
|
||||||
|
else:
|
||||||
|
assert_never(transcript_format)
|
||||||
|
|
||||||
|
|
||||||
|
@router.patch(
|
||||||
|
"/transcripts/{transcript_id}", response_model=GetTranscriptWithParticipants
|
||||||
|
)
|
||||||
async def transcript_update(
|
async def transcript_update(
|
||||||
transcript_id: str,
|
transcript_id: str,
|
||||||
info: UpdateTranscript,
|
info: UpdateTranscript,
|
||||||
@@ -419,9 +578,12 @@ async def transcript_get_topics(
|
|||||||
transcript_id, user_id=user_id
|
transcript_id, user_id=user_id
|
||||||
)
|
)
|
||||||
|
|
||||||
|
is_multitrack = await _get_is_multitrack(transcript)
|
||||||
|
|
||||||
# convert to GetTranscriptTopic
|
# convert to GetTranscriptTopic
|
||||||
return [
|
return [
|
||||||
GetTranscriptTopic.from_transcript_topic(topic) for topic in transcript.topics
|
GetTranscriptTopic.from_transcript_topic(topic, is_multitrack)
|
||||||
|
for topic in transcript.topics
|
||||||
]
|
]
|
||||||
|
|
||||||
|
|
||||||
@@ -438,9 +600,11 @@ async def transcript_get_topics_with_words(
|
|||||||
transcript_id, user_id=user_id
|
transcript_id, user_id=user_id
|
||||||
)
|
)
|
||||||
|
|
||||||
|
is_multitrack = await _get_is_multitrack(transcript)
|
||||||
|
|
||||||
# convert to GetTranscriptTopicWithWords
|
# convert to GetTranscriptTopicWithWords
|
||||||
return [
|
return [
|
||||||
GetTranscriptTopicWithWords.from_transcript_topic(topic)
|
GetTranscriptTopicWithWords.from_transcript_topic(topic, is_multitrack)
|
||||||
for topic in transcript.topics
|
for topic in transcript.topics
|
||||||
]
|
]
|
||||||
|
|
||||||
@@ -459,13 +623,17 @@ async def transcript_get_topics_with_words_per_speaker(
|
|||||||
transcript_id, user_id=user_id
|
transcript_id, user_id=user_id
|
||||||
)
|
)
|
||||||
|
|
||||||
|
is_multitrack = await _get_is_multitrack(transcript)
|
||||||
|
|
||||||
# get the topic from the transcript
|
# get the topic from the transcript
|
||||||
topic = next((t for t in transcript.topics if t.id == topic_id), None)
|
topic = next((t for t in transcript.topics if t.id == topic_id), None)
|
||||||
if not topic:
|
if not topic:
|
||||||
raise HTTPException(status_code=404, detail="Topic not found")
|
raise HTTPException(status_code=404, detail="Topic not found")
|
||||||
|
|
||||||
# convert to GetTranscriptTopicWithWordsPerSpeaker
|
# convert to GetTranscriptTopicWithWordsPerSpeaker
|
||||||
return GetTranscriptTopicWithWordsPerSpeaker.from_transcript_topic(topic)
|
return GetTranscriptTopicWithWordsPerSpeaker.from_transcript_topic(
|
||||||
|
topic, is_multitrack
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
@router.post("/transcripts/{transcript_id}/zulip")
|
@router.post("/transcripts/{transcript_id}/zulip")
|
||||||
|
|||||||
@@ -1,15 +1,19 @@
|
|||||||
from typing import Annotated, Optional
|
from typing import Annotated, Optional, assert_never
|
||||||
|
|
||||||
import celery
|
|
||||||
from fastapi import APIRouter, Depends, HTTPException
|
from fastapi import APIRouter, Depends, HTTPException
|
||||||
from pydantic import BaseModel
|
from pydantic import BaseModel
|
||||||
|
|
||||||
import reflector.auth as auth
|
import reflector.auth as auth
|
||||||
from reflector.db.recordings import recordings_controller
|
|
||||||
from reflector.db.transcripts import transcripts_controller
|
from reflector.db.transcripts import transcripts_controller
|
||||||
from reflector.pipelines.main_file_pipeline import task_pipeline_file_process
|
from reflector.services.transcript_process import (
|
||||||
from reflector.pipelines.main_multitrack_pipeline import (
|
ProcessError,
|
||||||
task_pipeline_multitrack_process,
|
ValidationAlreadyScheduled,
|
||||||
|
ValidationError,
|
||||||
|
ValidationLocked,
|
||||||
|
ValidationOk,
|
||||||
|
dispatch_transcript_processing,
|
||||||
|
prepare_transcript_processing,
|
||||||
|
validate_transcript_for_processing,
|
||||||
)
|
)
|
||||||
|
|
||||||
router = APIRouter()
|
router = APIRouter()
|
||||||
@@ -23,68 +27,28 @@ class ProcessStatus(BaseModel):
|
|||||||
async def transcript_process(
|
async def transcript_process(
|
||||||
transcript_id: str,
|
transcript_id: str,
|
||||||
user: Annotated[Optional[auth.UserInfo], Depends(auth.current_user_optional)],
|
user: Annotated[Optional[auth.UserInfo], Depends(auth.current_user_optional)],
|
||||||
):
|
) -> ProcessStatus:
|
||||||
user_id = user["sub"] if user else None
|
user_id = user["sub"] if user else None
|
||||||
transcript = await transcripts_controller.get_by_id_for_http(
|
transcript = await transcripts_controller.get_by_id_for_http(
|
||||||
transcript_id, user_id=user_id
|
transcript_id, user_id=user_id
|
||||||
)
|
)
|
||||||
|
|
||||||
if transcript.locked:
|
validation = await validate_transcript_for_processing(transcript)
|
||||||
raise HTTPException(status_code=400, detail="Transcript is locked")
|
if isinstance(validation, ValidationLocked):
|
||||||
|
raise HTTPException(status_code=400, detail=validation.detail)
|
||||||
if transcript.status == "idle":
|
elif isinstance(validation, ValidationError):
|
||||||
raise HTTPException(
|
raise HTTPException(status_code=400, detail=validation.detail)
|
||||||
status_code=400, detail="Recording is not ready for processing"
|
elif isinstance(validation, ValidationAlreadyScheduled):
|
||||||
)
|
return ProcessStatus(status=validation.detail)
|
||||||
|
elif isinstance(validation, ValidationOk):
|
||||||
# avoid duplicate scheduling for either pipeline
|
pass
|
||||||
if task_is_scheduled_or_active(
|
|
||||||
"reflector.pipelines.main_file_pipeline.task_pipeline_file_process",
|
|
||||||
transcript_id=transcript_id,
|
|
||||||
) or task_is_scheduled_or_active(
|
|
||||||
"reflector.pipelines.main_multitrack_pipeline.task_pipeline_multitrack_process",
|
|
||||||
transcript_id=transcript_id,
|
|
||||||
):
|
|
||||||
return ProcessStatus(status="already running")
|
|
||||||
|
|
||||||
# Determine processing mode strictly from DB to avoid S3 scans
|
|
||||||
bucket_name = None
|
|
||||||
track_keys: list[str] = []
|
|
||||||
|
|
||||||
if transcript.recording_id:
|
|
||||||
recording = await recordings_controller.get_by_id(transcript.recording_id)
|
|
||||||
if recording:
|
|
||||||
bucket_name = recording.bucket_name
|
|
||||||
track_keys = recording.track_keys
|
|
||||||
if track_keys is not None and len(track_keys) == 0:
|
|
||||||
raise HTTPException(
|
|
||||||
status_code=500,
|
|
||||||
detail="No track keys found, must be either > 0 or None",
|
|
||||||
)
|
|
||||||
if track_keys is not None and not bucket_name:
|
|
||||||
raise HTTPException(
|
|
||||||
status_code=500, detail="Bucket name must be specified"
|
|
||||||
)
|
|
||||||
|
|
||||||
if track_keys:
|
|
||||||
task_pipeline_multitrack_process.delay(
|
|
||||||
transcript_id=transcript_id,
|
|
||||||
bucket_name=bucket_name,
|
|
||||||
track_keys=track_keys,
|
|
||||||
)
|
|
||||||
else:
|
else:
|
||||||
# Default single-file pipeline
|
assert_never(validation)
|
||||||
task_pipeline_file_process.delay(transcript_id=transcript_id)
|
|
||||||
|
|
||||||
return ProcessStatus(status="ok")
|
config = await prepare_transcript_processing(validation)
|
||||||
|
|
||||||
|
if isinstance(config, ProcessError):
|
||||||
def task_is_scheduled_or_active(task_name: str, **kwargs):
|
raise HTTPException(status_code=500, detail=config.detail)
|
||||||
inspect = celery.current_app.control.inspect()
|
else:
|
||||||
|
dispatch_transcript_processing(config)
|
||||||
for worker, tasks in (inspect.scheduled() | inspect.active()).items():
|
return ProcessStatus(status="ok")
|
||||||
for task in tasks:
|
|
||||||
if task["name"] == task_name and task["kwargs"] == kwargs:
|
|
||||||
return True
|
|
||||||
|
|
||||||
return False
|
|
||||||
|
|||||||
@@ -3,6 +3,7 @@ from typing import Optional
|
|||||||
from fastapi import APIRouter, WebSocket
|
from fastapi import APIRouter, WebSocket
|
||||||
|
|
||||||
from reflector.auth.auth_jwt import JWTAuth # type: ignore
|
from reflector.auth.auth_jwt import JWTAuth # type: ignore
|
||||||
|
from reflector.db.users import user_controller
|
||||||
from reflector.ws_manager import get_ws_manager
|
from reflector.ws_manager import get_ws_manager
|
||||||
|
|
||||||
router = APIRouter()
|
router = APIRouter()
|
||||||
@@ -29,7 +30,18 @@ async def user_events_websocket(websocket: WebSocket):
|
|||||||
|
|
||||||
try:
|
try:
|
||||||
payload = JWTAuth().verify_token(token)
|
payload = JWTAuth().verify_token(token)
|
||||||
user_id = payload.get("sub")
|
authentik_uid = payload.get("sub")
|
||||||
|
|
||||||
|
if authentik_uid:
|
||||||
|
user = await user_controller.get_by_authentik_uid(authentik_uid)
|
||||||
|
if user:
|
||||||
|
user_id = user.id
|
||||||
|
else:
|
||||||
|
await websocket.close(code=UNAUTHORISED)
|
||||||
|
return
|
||||||
|
else:
|
||||||
|
await websocket.close(code=UNAUTHORISED)
|
||||||
|
return
|
||||||
except Exception:
|
except Exception:
|
||||||
await websocket.close(code=UNAUTHORISED)
|
await websocket.close(code=UNAUTHORISED)
|
||||||
return
|
return
|
||||||
|
|||||||
@@ -2,6 +2,7 @@ import json
|
|||||||
import os
|
import os
|
||||||
import re
|
import re
|
||||||
from datetime import datetime, timezone
|
from datetime import datetime, timezone
|
||||||
|
from typing import List
|
||||||
from urllib.parse import unquote
|
from urllib.parse import unquote
|
||||||
|
|
||||||
import av
|
import av
|
||||||
@@ -11,7 +12,7 @@ from celery import shared_task
|
|||||||
from celery.utils.log import get_task_logger
|
from celery.utils.log import get_task_logger
|
||||||
from pydantic import ValidationError
|
from pydantic import ValidationError
|
||||||
|
|
||||||
from reflector.dailyco_api import MeetingParticipantsResponse
|
from reflector.dailyco_api import RecordingResponse
|
||||||
from reflector.db.daily_participant_sessions import (
|
from reflector.db.daily_participant_sessions import (
|
||||||
DailyParticipantSession,
|
DailyParticipantSession,
|
||||||
daily_participant_sessions_controller,
|
daily_participant_sessions_controller,
|
||||||
@@ -21,7 +22,6 @@ from reflector.db.recordings import Recording, recordings_controller
|
|||||||
from reflector.db.rooms import rooms_controller
|
from reflector.db.rooms import rooms_controller
|
||||||
from reflector.db.transcripts import (
|
from reflector.db.transcripts import (
|
||||||
SourceKind,
|
SourceKind,
|
||||||
TranscriptParticipant,
|
|
||||||
transcripts_controller,
|
transcripts_controller,
|
||||||
)
|
)
|
||||||
from reflector.pipelines.main_file_pipeline import task_pipeline_file_process
|
from reflector.pipelines.main_file_pipeline import task_pipeline_file_process
|
||||||
@@ -38,7 +38,7 @@ from reflector.storage import get_transcripts_storage
|
|||||||
from reflector.utils.daily import (
|
from reflector.utils.daily import (
|
||||||
DailyRoomName,
|
DailyRoomName,
|
||||||
extract_base_room_name,
|
extract_base_room_name,
|
||||||
parse_daily_recording_filename,
|
filter_cam_audio_tracks,
|
||||||
recording_lock_key,
|
recording_lock_key,
|
||||||
)
|
)
|
||||||
from reflector.video_platforms.factory import create_platform_client
|
from reflector.video_platforms.factory import create_platform_client
|
||||||
@@ -273,15 +273,7 @@ async def _process_multitrack_recording_inner(
|
|||||||
# else: Recording already exists; metadata set at creation time
|
# else: Recording already exists; metadata set at creation time
|
||||||
|
|
||||||
transcript = await transcripts_controller.get_by_recording_id(recording.id)
|
transcript = await transcripts_controller.get_by_recording_id(recording.id)
|
||||||
if transcript:
|
if not transcript:
|
||||||
await transcripts_controller.update(
|
|
||||||
transcript,
|
|
||||||
{
|
|
||||||
"topics": [],
|
|
||||||
"participants": [],
|
|
||||||
},
|
|
||||||
)
|
|
||||||
else:
|
|
||||||
transcript = await transcripts_controller.add(
|
transcript = await transcripts_controller.add(
|
||||||
"",
|
"",
|
||||||
source_kind=SourceKind.ROOM,
|
source_kind=SourceKind.ROOM,
|
||||||
@@ -294,79 +286,10 @@ async def _process_multitrack_recording_inner(
|
|||||||
room_id=room.id,
|
room_id=room.id,
|
||||||
)
|
)
|
||||||
|
|
||||||
try:
|
|
||||||
async with create_platform_client("daily") as daily_client:
|
|
||||||
id_to_name = {}
|
|
||||||
id_to_user_id = {}
|
|
||||||
|
|
||||||
try:
|
|
||||||
rec_details = await daily_client.get_recording(recording_id)
|
|
||||||
mtg_session_id = rec_details.mtgSessionId
|
|
||||||
if mtg_session_id:
|
|
||||||
try:
|
|
||||||
payload: MeetingParticipantsResponse = (
|
|
||||||
await daily_client.get_meeting_participants(mtg_session_id)
|
|
||||||
)
|
|
||||||
for p in payload.data:
|
|
||||||
pid = p.participant_id
|
|
||||||
assert (
|
|
||||||
pid is not None
|
|
||||||
), "panic! participant id cannot be None"
|
|
||||||
name = p.user_name
|
|
||||||
user_id = p.user_id
|
|
||||||
if name:
|
|
||||||
id_to_name[pid] = name
|
|
||||||
if user_id:
|
|
||||||
id_to_user_id[pid] = user_id
|
|
||||||
except Exception as e:
|
|
||||||
logger.warning(
|
|
||||||
"Failed to fetch Daily meeting participants",
|
|
||||||
error=str(e),
|
|
||||||
mtg_session_id=mtg_session_id,
|
|
||||||
exc_info=True,
|
|
||||||
)
|
|
||||||
else:
|
|
||||||
logger.warning(
|
|
||||||
"No mtgSessionId found for recording; participant names may be generic",
|
|
||||||
recording_id=recording_id,
|
|
||||||
)
|
|
||||||
except Exception as e:
|
|
||||||
logger.warning(
|
|
||||||
"Failed to fetch Daily recording details",
|
|
||||||
error=str(e),
|
|
||||||
recording_id=recording_id,
|
|
||||||
exc_info=True,
|
|
||||||
)
|
|
||||||
|
|
||||||
for idx, key in enumerate(track_keys):
|
|
||||||
try:
|
|
||||||
parsed = parse_daily_recording_filename(key)
|
|
||||||
participant_id = parsed.participant_id
|
|
||||||
except ValueError as e:
|
|
||||||
logger.error(
|
|
||||||
"Failed to parse Daily recording filename",
|
|
||||||
error=str(e),
|
|
||||||
key=key,
|
|
||||||
exc_info=True,
|
|
||||||
)
|
|
||||||
continue
|
|
||||||
|
|
||||||
default_name = f"Speaker {idx}"
|
|
||||||
name = id_to_name.get(participant_id, default_name)
|
|
||||||
user_id = id_to_user_id.get(participant_id)
|
|
||||||
|
|
||||||
participant = TranscriptParticipant(
|
|
||||||
id=participant_id, speaker=idx, name=name, user_id=user_id
|
|
||||||
)
|
|
||||||
await transcripts_controller.upsert_participant(transcript, participant)
|
|
||||||
|
|
||||||
except Exception as e:
|
|
||||||
logger.warning("Failed to map participant names", error=str(e), exc_info=True)
|
|
||||||
|
|
||||||
task_pipeline_multitrack_process.delay(
|
task_pipeline_multitrack_process.delay(
|
||||||
transcript_id=transcript.id,
|
transcript_id=transcript.id,
|
||||||
bucket_name=bucket_name,
|
bucket_name=bucket_name,
|
||||||
track_keys=track_keys,
|
track_keys=filter_cam_audio_tracks(track_keys),
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
@@ -391,7 +314,7 @@ async def poll_daily_recordings():
|
|||||||
|
|
||||||
async with create_platform_client("daily") as daily_client:
|
async with create_platform_client("daily") as daily_client:
|
||||||
# latest 100. TODO cursor-based state
|
# latest 100. TODO cursor-based state
|
||||||
api_recordings = await daily_client.list_recordings()
|
api_recordings: List[RecordingResponse] = await daily_client.list_recordings()
|
||||||
|
|
||||||
if not api_recordings:
|
if not api_recordings:
|
||||||
logger.debug(
|
logger.debug(
|
||||||
@@ -422,17 +345,19 @@ async def poll_daily_recordings():
|
|||||||
|
|
||||||
for recording in missing_recordings:
|
for recording in missing_recordings:
|
||||||
if not recording.tracks:
|
if not recording.tracks:
|
||||||
assert recording.status != "finished", (
|
if recording.status == "finished":
|
||||||
f"Recording {recording.id} has status='finished' but no tracks. "
|
logger.warning(
|
||||||
f"Daily.co API guarantees finished recordings have tracks available. "
|
"Finished recording has no tracks (no audio captured)",
|
||||||
f"room_name={recording.room_name}"
|
recording_id=recording.id,
|
||||||
)
|
room_name=recording.room_name,
|
||||||
logger.debug(
|
)
|
||||||
"No tracks in recording yet",
|
else:
|
||||||
recording_id=recording.id,
|
logger.debug(
|
||||||
room_name=recording.room_name,
|
"No tracks in recording yet",
|
||||||
status=recording.status,
|
recording_id=recording.id,
|
||||||
)
|
room_name=recording.room_name,
|
||||||
|
status=recording.status,
|
||||||
|
)
|
||||||
continue
|
continue
|
||||||
|
|
||||||
track_keys = [t.s3Key for t in recording.tracks if t.type == "audio"]
|
track_keys = [t.s3Key for t in recording.tracks if t.type == "audio"]
|
||||||
|
|||||||
292
server/scripts/migrate_user_ids.py
Executable file
292
server/scripts/migrate_user_ids.py
Executable file
@@ -0,0 +1,292 @@
|
|||||||
|
#!/usr/bin/env python3
|
||||||
|
"""
|
||||||
|
Manual Migration Script: Migrate user_id from Authentik UID to internal user.id
|
||||||
|
|
||||||
|
This script should be run manually AFTER applying the database schema migrations.
|
||||||
|
|
||||||
|
Usage:
|
||||||
|
AUTHENTIK_API_URL=https://your-authentik-url \
|
||||||
|
AUTHENTIK_API_TOKEN=your-token \
|
||||||
|
DATABASE_URL=postgresql://... \
|
||||||
|
python scripts/migrate_user_ids.py
|
||||||
|
|
||||||
|
What this script does:
|
||||||
|
1. Collects all unique Authentik UIDs currently used in the database
|
||||||
|
2. Fetches only those users from Authentik API to populate the users table
|
||||||
|
3. Updates user_id in: user_api_key, transcript, room, meeting_consent
|
||||||
|
4. Uses user.authentik_uid to lookup the corresponding user.id
|
||||||
|
|
||||||
|
The script is idempotent:
|
||||||
|
- User inserts use ON CONFLICT DO NOTHING (safe if users already exist)
|
||||||
|
- Update queries only match authentik_uid->uuid pairs (no-op if already migrated)
|
||||||
|
- Safe to run multiple times without side effects
|
||||||
|
|
||||||
|
Prerequisites:
|
||||||
|
- AUTHENTIK_API_URL environment variable must be set
|
||||||
|
- AUTHENTIK_API_TOKEN environment variable must be set
|
||||||
|
- DATABASE_URL environment variable must be set
|
||||||
|
- Authentik API must be accessible
|
||||||
|
"""
|
||||||
|
|
||||||
|
import asyncio
|
||||||
|
import os
|
||||||
|
import sys
|
||||||
|
from datetime import datetime, timezone
|
||||||
|
from typing import Any
|
||||||
|
|
||||||
|
import httpx
|
||||||
|
from sqlalchemy import text
|
||||||
|
from sqlalchemy.ext.asyncio import AsyncConnection, create_async_engine
|
||||||
|
|
||||||
|
TABLES_WITH_USER_ID = ["user_api_key", "transcript", "room", "meeting_consent"]
|
||||||
|
NULLABLE_USER_ID_TABLES = {"transcript", "meeting_consent"}
|
||||||
|
AUTHENTIK_PAGE_SIZE = 100
|
||||||
|
HTTP_TIMEOUT = 30.0
|
||||||
|
|
||||||
|
|
||||||
|
class AuthentikClient:
|
||||||
|
def __init__(self, api_url: str, api_token: str):
|
||||||
|
self.api_url = api_url
|
||||||
|
self.api_token = api_token
|
||||||
|
|
||||||
|
def _get_headers(self) -> dict[str, str]:
|
||||||
|
return {
|
||||||
|
"Authorization": f"Bearer {self.api_token}",
|
||||||
|
"Accept": "application/json",
|
||||||
|
}
|
||||||
|
|
||||||
|
async def fetch_all_users(self) -> list[dict[str, Any]]:
|
||||||
|
all_users = []
|
||||||
|
page = 1
|
||||||
|
|
||||||
|
try:
|
||||||
|
async with httpx.AsyncClient(timeout=HTTP_TIMEOUT) as client:
|
||||||
|
while True:
|
||||||
|
url = f"{self.api_url}/api/v3/core/users/"
|
||||||
|
params = {
|
||||||
|
"page": page,
|
||||||
|
"page_size": AUTHENTIK_PAGE_SIZE,
|
||||||
|
"include_groups": "false",
|
||||||
|
}
|
||||||
|
|
||||||
|
print(f" Fetching users from Authentik (page {page})...")
|
||||||
|
response = await client.get(
|
||||||
|
url, headers=self._get_headers(), params=params
|
||||||
|
)
|
||||||
|
response.raise_for_status()
|
||||||
|
data = response.json()
|
||||||
|
|
||||||
|
results = data.get("results", [])
|
||||||
|
if not results:
|
||||||
|
break
|
||||||
|
|
||||||
|
all_users.extend(results)
|
||||||
|
print(f" Fetched {len(results)} users from page {page}")
|
||||||
|
|
||||||
|
if not data.get("next"):
|
||||||
|
break
|
||||||
|
|
||||||
|
page += 1
|
||||||
|
|
||||||
|
print(f" Total: {len(all_users)} users fetched from Authentik")
|
||||||
|
return all_users
|
||||||
|
|
||||||
|
except httpx.HTTPError as e:
|
||||||
|
raise Exception(f"Failed to fetch users from Authentik: {e}") from e
|
||||||
|
|
||||||
|
|
||||||
|
async def collect_used_authentik_uids(connection: AsyncConnection) -> set[str]:
    """Collect the ``user_id`` values that still have to be migrated.

    Every table in ``TABLES_WITH_USER_ID`` is queried for its distinct,
    non-NULL ``user_id`` values. Values that already look like a UUID
    (36 characters, 4 dashes) are treated as migrated and excluded.

    Every collected ID is classified, not just one arbitrary sample, so the
    result does not depend on set iteration order when the database is only
    partially migrated.

    Args:
        connection: Open async connection used to run the SELECT statements.

    Returns:
        The set of IDs that are not yet in UUID format; an empty set when
        nothing was found or everything is already migrated.
    """
    print("\nStep 1: Collecting Authentik UIDs from database tables...")
    used_authentik_uids: set[str] = set()

    for table in TABLES_WITH_USER_ID:
        # Table names come from the module constant above, never from user input.
        result = await connection.execute(
            text(f'SELECT DISTINCT user_id FROM "{table}" WHERE user_id IS NOT NULL')
        )
        authentik_uids = [row[0] for row in result.fetchall()]
        used_authentik_uids.update(authentik_uids)
        print(f" Found {len(authentik_uids)} unique Authentik UIDs in {table}")

    print(f" Total unique user IDs found: {len(used_authentik_uids)}")

    def _looks_like_uuid(value: str) -> bool:
        """Same shape test the script has always used for migrated IDs."""
        return len(value) == 36 and value.count("-") == 4

    already_migrated = {uid for uid in used_authentik_uids if _looks_like_uuid(uid)}
    pending = used_authentik_uids - already_migrated

    if already_migrated and not pending:
        # min() gives a stable sample for the message.
        sample_id = min(already_migrated)
        print(
            f"\n✅ User IDs are already in UUID format (e.g., {sample_id[:20]}...)"
        )
        print("Migration has already been completed!")
        return set()

    if already_migrated:
        print(
            f" {len(already_migrated)} user IDs are already in UUID format; "
            f"{len(pending)} still need migration"
        )

    return pending
|
||||||
|
|
||||||
|
|
||||||
|
def filter_users_by_authentik_uid(
    authentik_users: list[dict[str, Any]], used_authentik_uids: set[str]
) -> tuple[list[dict[str, Any]], set[str]]:
    """Keep only the Authentik users whose ``uid`` is referenced in the database.

    Args:
        authentik_users: User records as returned by the Authentik API.
        used_authentik_uids: UIDs found in the database tables.

    Returns:
        ``(matching_users, missing_ids)``: the records whose ``uid`` is in
        ``used_authentik_uids`` (input order preserved), and the UIDs from the
        database that no record carries. Missing IDs are also printed.
    """
    matched_users = []
    matched_uids = set()
    for candidate in authentik_users:
        candidate_uid = candidate.get("uid")
        if candidate_uid in used_authentik_uids:
            matched_users.append(candidate)
            matched_uids.add(candidate_uid)

    unmatched_ids = used_authentik_uids - matched_uids

    print(
        f" Found {len(matched_users)} matching users in Authentik "
        f"(out of {len(authentik_users)} total)"
    )

    if unmatched_ids:
        print(
            f" ⚠ Warning: {len(unmatched_ids)} Authentik UIDs in database not found in Authentik:"
        )
        # Sorted so the warning list is stable between runs.
        for orphan_id in sorted(unmatched_ids):
            print(f" - {orphan_id}")

    return matched_users, unmatched_ids
|
||||||
|
|
||||||
|
|
||||||
|
async def sync_users_to_database(
    connection: AsyncConnection, authentik_users: list[dict[str, Any]]
) -> tuple[int, int]:
    """Insert the given Authentik users into the ``"user"`` table.

    Each record's ``uuid`` becomes the row id and its ``uid`` is stored as
    ``authentik_uid``. Records without an email are skipped. Rows whose id
    already exists are left untouched (``ON CONFLICT (id) DO NOTHING``).

    Args:
        connection: Open async connection used for the INSERT statements.
        authentik_users: Records that must contain ``uuid`` and ``uid`` keys.

    Returns:
        ``(created, skipped)``: rows actually inserted, and records skipped
        for lacking an email.
    """
    inserted_count = 0
    skipped_count = 0
    # One timestamp shared by every row written in this run.
    timestamp = datetime.now(timezone.utc)

    for record in authentik_users:
        internal_id = record["uuid"]
        external_uid = record["uid"]
        address = record.get("email")

        if not address:
            print(f" ⚠ Skipping user {external_uid} (no email)")
            skipped_count += 1
            continue

        row_values = {
            "id": internal_id,
            "email": address,
            "authentik_uid": external_uid,
            "created_at": timestamp,
            "updated_at": timestamp,
        }
        outcome = await connection.execute(
            text("""
                INSERT INTO "user" (id, email, authentik_uid, created_at, updated_at)
                VALUES (:id, :email, :authentik_uid, :created_at, :updated_at)
                ON CONFLICT (id) DO NOTHING
            """),
            row_values,
        )
        # rowcount is 0 when the conflict clause suppressed the insert.
        if outcome.rowcount > 0:
            inserted_count += 1

    return inserted_count, skipped_count
|
||||||
|
|
||||||
|
|
||||||
|
async def migrate_all_user_ids(connection: AsyncConnection) -> int:
    """Rewrite ``user_id`` in every tracked table to the internal user id.

    For each table in ``TABLES_WITH_USER_ID`` an ``UPDATE ... FROM "user"``
    replaces ``user_id`` with ``u.id`` where it equals ``u.authentik_uid``.

    Args:
        connection: Open async connection used for the UPDATE statements.

    Returns:
        The sum of the row counts reported by all UPDATE statements.
    """
    print("\nStep 3: Migrating user_id columns from Authentik UID to internal UUID...")
    print("(If no rows are updated, migration may have already been completed)")

    updated_rows_total = 0

    for table in TABLES_WITH_USER_ID:
        # Only the tables listed as nullable get the explicit NOT NULL filter.
        if table in NULLABLE_USER_ID_TABLES:
            null_check = f"AND {table}.user_id IS NOT NULL"
        else:
            null_check = ""

        query = f"""
            UPDATE {table}
            SET user_id = u.id
            FROM "user" u
            WHERE {table}.user_id = u.authentik_uid
            {null_check}
        """

        print(f" Updating {table}.user_id...")
        outcome = await connection.execute(text(query))
        rows = outcome.rowcount
        print(f" ✓ Updated {rows} rows")
        updated_rows_total += rows

    return updated_rows_total
|
||||||
|
|
||||||
|
|
||||||
|
async def run_migration(
    database_url: str, authentik_api_url: str, authentik_api_token: str
) -> None:
    """Run the whole user-id migration inside one ``engine.begin()`` block.

    Steps: collect the user IDs referenced in the database, fetch all users
    from Authentik, insert the referenced ones into ``"user"``, then rewrite
    the ``user_id`` columns. Progress is printed throughout.

    Exits the process with status 1 when Authentik returns no users or when
    any exception is raised. The engine is disposed in every case.

    Args:
        database_url: URL passed to ``create_async_engine``.
        authentik_api_url: Base URL of the Authentik API.
        authentik_api_token: Bearer token for the Authentik API.
    """
    engine = create_async_engine(database_url)

    try:
        async with engine.begin() as conn:
            referenced_uids = await collect_used_authentik_uids(conn)
            if not referenced_uids:
                print("\n⚠️ No user IDs found in database. Nothing to migrate.")
                print("Migration complete (no-op)!")
                return

            print("\nStep 2: Fetching user data from Authentik and syncing users...")
            print("(This script is idempotent - safe to run multiple times)")
            print(f"Authentik API URL: {authentik_api_url}")

            authentik = AuthentikClient(authentik_api_url, authentik_api_token)
            remote_users = await authentik.fetch_all_users()

            if not remote_users:
                print("\nERROR: No users returned from Authentik API.")
                print(
                    "Please verify your Authentik configuration and ensure users exist."
                )
                # SystemExit is not caught by the ``except Exception`` below.
                sys.exit(1)

            relevant_users, _ = filter_users_by_authentik_uid(
                remote_users, referenced_uids
            )
            n_created, n_skipped = await sync_users_to_database(conn, relevant_users)

            if n_created > 0:
                creation_message = f"✓ Created {n_created} users from Authentik"
            else:
                creation_message = "✓ No new users created (users may already exist)"
            print(creation_message)

            if n_skipped > 0:
                print(f" ⚠ Skipped {n_skipped} users without email")

            count_result = await conn.execute(text('SELECT COUNT(*) FROM "user"'))
            user_total = count_result.scalar()
            print(f"✓ Users table now has {user_total} users")

            rows_changed = await migrate_all_user_ids(conn)

            if rows_changed > 0:
                print(f"\n✅ Migration complete! Updated {rows_changed} total rows.")
            else:
                print(
                    "\n✅ Migration complete! (No rows updated - migration may have already been completed)"
                )

    except Exception as e:
        print(f"\n❌ ERROR: Migration failed: {e}")
        sys.exit(1)
    finally:
        await engine.dispose()
|
||||||
|
|
||||||
|
|
||||||
|
async def main() -> None:
    """Read the configuration from the environment and start the migration.

    ``DATABASE_URL``, ``AUTHENTIK_API_URL`` and ``AUTHENTIK_API_TOKEN`` must
    all be set to non-empty values; otherwise an error is printed and the
    process exits with status 1.
    """
    required = ("DATABASE_URL", "AUTHENTIK_API_URL", "AUTHENTIK_API_TOKEN")
    settings = {name: os.getenv(name) for name in required}

    # An unset or empty variable counts as missing.
    if not all(settings.values()):
        print(
            "ERROR: DATABASE_URL, AUTHENTIK_API_URL, and AUTHENTIK_API_TOKEN must be set"
        )
        sys.exit(1)

    await run_migration(
        settings["DATABASE_URL"],
        settings["AUTHENTIK_API_URL"],
        settings["AUTHENTIK_API_TOKEN"],
    )
|
||||||
|
|
||||||
|
|
||||||
|
# Script entry point: run the async ``main`` coroutine when executed directly.
if __name__ == "__main__":
    asyncio.run(main())
|
||||||
@@ -159,3 +159,78 @@ def test_processor_transcript_segment():
|
|||||||
assert segments[3].start == 30.72
|
assert segments[3].start == 30.72
|
||||||
assert segments[4].start == 31.56
|
assert segments[4].start == 31.56
|
||||||
assert segments[5].start == 32.38
|
assert segments[5].start == 32.38
|
||||||
|
|
||||||
|
|
||||||
|
def test_processor_transcript_segment_multitrack_interleaved():
    """as_segments(is_multitrack=True) regroups speakers whose words interleave.

    In a multitrack recording the words of all speakers are ordered by start
    time, so the speaker changes on almost every word. Multitrack mode is
    expected to group by speaker first and then split into sentences.
    """
    from reflector.processors.types import Transcript, Word

    # Speaker 0 says "Hello there." and speaker 1 says "I'm good.";
    # ordering by start time interleaves the two utterances.
    interleaved_words = [
        Word(text="Hello ", start=0.0, end=0.5, speaker=0),
        Word(text="I'm ", start=0.5, end=0.8, speaker=1),
        Word(text="there.", start=0.5, end=1.0, speaker=0),
        Word(text="good.", start=1.0, end=1.5, speaker=1),
    ]
    transcript = Transcript(words=interleaved_words)

    # Default mode starts a new segment at every speaker change: 4 segments.
    per_change_segments = transcript.as_segments(is_multitrack=False)
    assert len(per_change_segments) == 4

    # Multitrack mode yields one sentence per speaker: 2 segments.
    per_speaker_segments = transcript.as_segments(is_multitrack=True)
    assert len(per_speaker_segments) == 2

    # Expected content, ordered by start time.
    expected_segments = [
        (0, "Hello there.", 0.0, 1.0),
        (1, "I'm good.", 0.5, 1.5),
    ]
    for segment, (speaker, content, start, end) in zip(
        per_speaker_segments, expected_segments
    ):
        assert segment.speaker == speaker
        assert segment.text == content
        assert segment.start == start
        assert segment.end == end
|
||||||
|
|
||||||
|
|
||||||
|
def test_processor_transcript_segment_multitrack_overlapping_timestamps():
    """Multitrack segmentation when two speakers share identical word timestamps (real Daily.co data pattern)."""
    from reflector.processors.types import Transcript, Word

    # Pattern taken from transcript 38d84d57: both speakers produce a word
    # with exactly the same start/end at every step.
    shared_timeline = [
        ("speaking ", "Speaking ", 6.71, 7.11),
        ("at ", "at ", 7.11, 7.27),
        ("the ", "the ", 7.27, 7.43),
        ("same ", "same ", 7.43, 7.59),
        ("time.", "time.", 7.59, 8.0),
    ]
    words = []
    for first_text, second_text, start, end in shared_timeline:
        words.append(Word(text=first_text, start=start, end=end, speaker=0))
        words.append(Word(text=second_text, start=start, end=end, speaker=1))
    transcript = Transcript(words=words)

    # Default mode: one segment per speaker change, 10 in total.
    per_change_segments = transcript.as_segments(is_multitrack=False)
    assert len(per_change_segments) == 10

    # Multitrack mode: one sentence per speaker, 2 in total.
    per_speaker_segments = transcript.as_segments(is_multitrack=True)
    assert len(per_speaker_segments) == 2

    # Each segment must carry a complete sentence.
    first_segment, second_segment = per_speaker_segments[0], per_speaker_segments[1]
    assert "speaking at the same time." in first_segment.text
    assert "Speaking at the same time." in second_segment.text
|
||||||
|
|||||||
779
server/tests/test_transcript_formats.py
Normal file
779
server/tests/test_transcript_formats.py
Normal file
@@ -0,0 +1,779 @@
|
|||||||
|
"""Tests for transcript format conversion functionality."""
|
||||||
|
|
||||||
|
import pytest
|
||||||
|
|
||||||
|
from reflector.db.transcripts import TranscriptParticipant, TranscriptTopic
|
||||||
|
from reflector.processors.types import Word
|
||||||
|
from reflector.utils.transcript_formats import (
|
||||||
|
format_timestamp_mmss,
|
||||||
|
get_speaker_name,
|
||||||
|
topics_to_webvtt_named,
|
||||||
|
transcript_to_json_segments,
|
||||||
|
transcript_to_text,
|
||||||
|
transcript_to_text_timestamped,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_get_speaker_name_with_participants():
    """Known speakers resolve to the participant name, unknown ones to "Speaker N"."""
    roster = [
        TranscriptParticipant(id="1", speaker=0, name="John Smith"),
        TranscriptParticipant(id="2", speaker=1, name="Jane Doe"),
    ]

    expected_names = (
        (0, "John Smith"),
        (1, "Jane Doe"),
        (2, "Speaker 2"),  # not in the roster
    )
    for speaker, expected in expected_names:
        assert get_speaker_name(speaker, roster) == expected
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_get_speaker_name_without_participants():
    """With ``None`` or an empty list the name is always "Speaker N"."""
    cases = (
        (0, None, "Speaker 0"),
        (1, None, "Speaker 1"),
        (5, [], "Speaker 5"),
    )
    for speaker, roster, expected in cases:
        assert get_speaker_name(speaker, roster) == expected
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_format_timestamp_mmss():
    """Seconds are rendered as MM:SS; minutes are not wrapped at one hour."""
    expected_by_seconds = {
        0: "00:00",
        5: "00:05",
        65: "01:05",
        125.7: "02:05",
        3661: "61:01",
    }
    for seconds, rendered in expected_by_seconds.items():
        assert format_timestamp_mmss(seconds) == rendered
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_transcript_to_text():
    """Plain-text export emits one "<name>: <text>" line per segment."""
    john_words = [
        Word(text="Hello", start=0.0, end=1.0, speaker=0),
        Word(text=" world.", start=1.0, end=2.0, speaker=0),
    ]
    jane_words = [
        Word(text="How", start=2.0, end=3.0, speaker=1),
        Word(text=" are", start=3.0, end=4.0, speaker=1),
        Word(text=" you?", start=4.0, end=5.0, speaker=1),
    ]
    topics = [
        TranscriptTopic(
            id="1", title="Topic 1", summary="Summary 1", timestamp=0.0, words=john_words
        ),
        TranscriptTopic(
            id="2", title="Topic 2", summary="Summary 2", timestamp=2.0, words=jane_words
        ),
    ]
    participants = [
        TranscriptParticipant(id="1", speaker=0, name="John Smith"),
        TranscriptParticipant(id="2", speaker=1, name="Jane Doe"),
    ]

    rendered_lines = transcript_to_text(topics, participants).split("\n")

    assert len(rendered_lines) == 2
    first_line, second_line = rendered_lines
    assert first_line == "John Smith: Hello world."
    assert second_line == "Jane Doe: How are you?"
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_transcript_to_text_timestamped():
    """Timestamped export prefixes every line with the segment start as [MM:SS]."""
    john_words = [
        Word(text="Hello", start=0.0, end=1.0, speaker=0),
        Word(text=" world.", start=1.0, end=2.0, speaker=0),
    ]
    # Second topic starts past the one-minute mark to exercise the MM part.
    jane_words = [
        Word(text="How", start=65.0, end=66.0, speaker=1),
        Word(text=" are", start=66.0, end=67.0, speaker=1),
        Word(text=" you?", start=67.0, end=68.0, speaker=1),
    ]
    topics = [
        TranscriptTopic(
            id="1", title="Topic 1", summary="Summary 1", timestamp=0.0, words=john_words
        ),
        TranscriptTopic(
            id="2", title="Topic 2", summary="Summary 2", timestamp=65.0, words=jane_words
        ),
    ]
    participants = [
        TranscriptParticipant(id="1", speaker=0, name="John Smith"),
        TranscriptParticipant(id="2", speaker=1, name="Jane Doe"),
    ]

    rendered_lines = transcript_to_text_timestamped(topics, participants).split("\n")

    assert len(rendered_lines) == 2
    first_line, second_line = rendered_lines
    assert first_line == "[00:00] John Smith: Hello world."
    assert second_line == "[01:05] Jane Doe: How are you?"
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_topics_to_webvtt_named():
    """WebVTT export carries the participant name in a ``<v ...>`` voice tag."""
    greeting = [
        Word(text="Hello", start=0.0, end=1.0, speaker=0),
        Word(text=" world.", start=1.0, end=2.0, speaker=0),
    ]
    topics = [
        TranscriptTopic(
            id="1", title="Topic 1", summary="Summary 1", timestamp=0.0, words=greeting
        ),
    ]
    participants = [TranscriptParticipant(id="1", speaker=0, name="John Smith")]

    vtt = topics_to_webvtt_named(topics, participants)

    assert vtt.startswith("WEBVTT")
    required_fragments = (
        "<v John Smith>",
        "00:00:00.000 --> 00:00:02.000",
        "Hello world.",
    )
    for fragment in required_fragments:
        assert fragment in vtt
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_transcript_to_json_segments():
    """JSON export returns one segment per speaker turn with name, text and bounds."""
    john_words = [
        Word(text="Hello", start=0.0, end=1.0, speaker=0),
        Word(text=" world.", start=1.0, end=2.0, speaker=0),
    ]
    jane_words = [
        Word(text="How", start=2.0, end=3.0, speaker=1),
        Word(text=" are", start=3.0, end=4.0, speaker=1),
        Word(text=" you?", start=4.0, end=5.0, speaker=1),
    ]
    topics = [
        TranscriptTopic(
            id="1", title="Topic 1", summary="Summary 1", timestamp=0.0, words=john_words
        ),
        TranscriptTopic(
            id="2", title="Topic 2", summary="Summary 2", timestamp=2.0, words=jane_words
        ),
    ]
    participants = [
        TranscriptParticipant(id="1", speaker=0, name="John Smith"),
        TranscriptParticipant(id="2", speaker=1, name="Jane Doe"),
    ]

    segments = transcript_to_json_segments(topics, participants)

    assert len(segments) == 2

    # (speaker, speaker_name, text, start, end) for each expected segment.
    expected_rows = [
        (0, "John Smith", "Hello world.", 0.0, 2.0),
        (1, "Jane Doe", "How are you?", 2.0, 5.0),
    ]
    for segment, (speaker, name, content, start, end) in zip(segments, expected_rows):
        assert segment.speaker == speaker
        assert segment.speaker_name == name
        assert segment.text == content
        assert segment.start == start
        assert segment.end == end
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_transcript_formats_with_empty_topics():
    """Every formatter copes with an empty topics list."""
    no_topics = []
    no_participants = []

    plain = transcript_to_text(no_topics, no_participants)
    assert plain == ""

    stamped = transcript_to_text_timestamped(no_topics, no_participants)
    assert stamped == ""

    # The WebVTT header is still emitted for an empty transcript.
    vtt = topics_to_webvtt_named(no_topics, no_participants)
    assert "WEBVTT" in vtt

    as_json = transcript_to_json_segments(no_topics, no_participants)
    assert as_json == []
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_transcript_formats_with_empty_words():
    """Every formatter copes with a topic that contains no words."""
    wordless_topic = TranscriptTopic(
        id="1",
        title="Topic 1",
        summary="Summary 1",
        timestamp=0.0,
        words=[],
    )
    topics = [wordless_topic]
    participants = []

    plain = transcript_to_text(topics, participants)
    assert plain == ""

    stamped = transcript_to_text_timestamped(topics, participants)
    assert stamped == ""

    # The WebVTT header is still emitted when there is nothing to caption.
    vtt = topics_to_webvtt_named(topics, participants)
    assert "WEBVTT" in vtt

    as_json = transcript_to_json_segments(topics, participants)
    assert as_json == []
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_transcript_formats_with_multiple_speakers():
    """A topic with several speaker changes yields one segment per turn."""
    # Alice, then Bob, then Alice again, all inside one topic.
    conversation = [
        Word(text="Hello", start=0.0, end=1.0, speaker=0),
        Word(text=" there.", start=1.0, end=2.0, speaker=0),
        Word(text="Hi", start=2.0, end=3.0, speaker=1),
        Word(text=" back.", start=3.0, end=4.0, speaker=1),
        Word(text="Good", start=4.0, end=5.0, speaker=0),
        Word(text=" morning.", start=5.0, end=6.0, speaker=0),
    ]
    topics = [
        TranscriptTopic(
            id="1",
            title="Topic 1",
            summary="Summary 1",
            timestamp=0.0,
            words=conversation,
        ),
    ]
    participants = [
        TranscriptParticipant(id="1", speaker=0, name="Alice"),
        TranscriptParticipant(id="2", speaker=1, name="Bob"),
    ]

    rendered_lines = transcript_to_text(topics, participants).split("\n")
    assert len(rendered_lines) == 3
    expected_fragments = (
        "Alice: Hello there.",
        "Bob: Hi back.",
        "Alice: Good morning.",
    )
    for line, fragment in zip(rendered_lines, expected_fragments):
        assert fragment in line

    segments = transcript_to_json_segments(topics, participants)
    assert len(segments) == 3
    for segment, name in zip(segments, ("Alice", "Bob", "Alice")):
        assert segment.speaker_name == name
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_transcript_formats_with_overlapping_speakers_multitrack():
    """All formatters, in multitrack mode, on words that truly interleave.

    Multitrack recordings order the words of every speaker by start time, so
    the speaker alternates constantly. With ``is_multitrack=True`` each
    formatter should emit complete per-speaker sentences instead.
    """
    # Alice says "Hello there." (0.0-1.0) while Bob says "I'm good." (0.5-1.5).
    # Ordered by time the words come out as: Hello, I'm, there., good.
    interleaved_words = [
        Word(text="Hello ", start=0.0, end=0.5, speaker=0),
        Word(text="I'm ", start=0.5, end=0.8, speaker=1),
        Word(text="there.", start=0.5, end=1.0, speaker=0),
        Word(text="good.", start=1.0, end=1.5, speaker=1),
    ]
    topics = [
        TranscriptTopic(
            id="1",
            title="Topic 1",
            summary="Summary 1",
            timestamp=0.0,
            words=interleaved_words,
        ),
    ]
    participants = [
        TranscriptParticipant(id="1", speaker=0, name="Alice"),
        TranscriptParticipant(id="2", speaker=1, name="Bob"),
    ]

    # Multitrack mode must give 2 cues (one sentence per speaker),
    # not 4 (one per speaker change).
    vtt = topics_to_webvtt_named(topics, participants, is_multitrack=True)
    expected_vtt = (
        "WEBVTT\n"
        "\n"
        "00:00:00.000 --> 00:00:01.000\n"
        "<v Alice>Hello there.\n"
        "\n"
        "00:00:00.500 --> 00:00:01.500\n"
        "<v Bob>I'm good.\n"
    )
    assert vtt == expected_vtt

    plain_lines = transcript_to_text(topics, participants, is_multitrack=True).split(
        "\n"
    )
    assert len(plain_lines) == 2
    assert "Alice: Hello there." in plain_lines[0]
    assert "Bob: I'm good." in plain_lines[1]

    stamped_lines = transcript_to_text_timestamped(
        topics, participants, is_multitrack=True
    ).split("\n")
    assert len(stamped_lines) == 2
    assert "[00:00] Alice: Hello there." in stamped_lines[0]
    assert "[00:00] Bob: I'm good." in stamped_lines[1]

    json_segments = transcript_to_json_segments(
        topics, participants, is_multitrack=True
    )
    assert len(json_segments) == 2
    alice_segment, bob_segment = json_segments[0], json_segments[1]
    assert alice_segment.speaker_name == "Alice"
    assert alice_segment.text == "Hello there."
    assert bob_segment.speaker_name == "Bob"
    assert bob_segment.text == "I'm good."
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_api_transcript_format_text(client):
    """GET /transcripts/{id}?transcript_format=text returns speaker-prefixed text."""
    created = await client.post("/transcripts", json={"name": "Test transcript"})
    assert created.status_code == 200
    transcript_id = created.json()["id"]

    from reflector.db.transcripts import (
        TranscriptParticipant,
        TranscriptTopic,
        transcripts_controller,
    )
    from reflector.processors.types import Word

    transcript = await transcripts_controller.get_by_id(transcript_id)

    # Attach two named participants to the stored transcript.
    roster = [
        TranscriptParticipant(id="1", speaker=0, name="John Smith"),
        TranscriptParticipant(id="2", speaker=1, name="Jane Doe"),
    ]
    await transcripts_controller.update(
        transcript,
        {"participants": [member.model_dump() for member in roster]},
    )

    topic = TranscriptTopic(
        title="Topic 1",
        summary="Summary 1",
        timestamp=0,
        words=[
            Word(text="Hello", start=0, end=1, speaker=0),
            Word(text=" world.", start=1, end=2, speaker=0),
        ],
    )
    await transcripts_controller.upsert_topic(transcript, topic)

    fetched = await client.get(f"/transcripts/{transcript_id}?transcript_format=text")
    assert fetched.status_code == 200
    payload = fetched.json()

    assert payload["transcript_format"] == "text"
    assert "transcript" in payload
    assert "John Smith: Hello world." in payload["transcript"]
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_api_transcript_format_text_timestamped(client):
    """GET /transcripts/{id}?transcript_format=text-timestamped prefixes lines with [MM:SS]."""
    created = await client.post("/transcripts", json={"name": "Test transcript"})
    assert created.status_code == 200
    transcript_id = created.json()["id"]

    from reflector.db.transcripts import (
        TranscriptParticipant,
        TranscriptTopic,
        transcripts_controller,
    )
    from reflector.processors.types import Word

    transcript = await transcripts_controller.get_by_id(transcript_id)

    speaker_zero = TranscriptParticipant(id="1", speaker=0, name="John Smith")
    await transcripts_controller.update(
        transcript,
        {"participants": [speaker_zero.model_dump()]},
    )

    # The words start at 65 s so the expected prefix is [01:05].
    topic = TranscriptTopic(
        title="Topic 1",
        summary="Summary 1",
        timestamp=0,
        words=[
            Word(text="Hello", start=65, end=66, speaker=0),
            Word(text=" world.", start=66, end=67, speaker=0),
        ],
    )
    await transcripts_controller.upsert_topic(transcript, topic)

    fetched = await client.get(
        f"/transcripts/{transcript_id}?transcript_format=text-timestamped"
    )
    assert fetched.status_code == 200
    payload = fetched.json()

    assert payload["transcript_format"] == "text-timestamped"
    assert "transcript" in payload
    assert "[01:05] John Smith: Hello world." in payload["transcript"]
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_api_transcript_format_webvtt_named(client):
    """GET /transcripts/{id}?transcript_format=webvtt-named returns WebVTT with voice tags."""
    created = await client.post("/transcripts", json={"name": "Test transcript"})
    assert created.status_code == 200
    transcript_id = created.json()["id"]

    from reflector.db.transcripts import (
        TranscriptParticipant,
        TranscriptTopic,
        transcripts_controller,
    )
    from reflector.processors.types import Word

    transcript = await transcripts_controller.get_by_id(transcript_id)

    speaker_zero = TranscriptParticipant(id="1", speaker=0, name="John Smith")
    await transcripts_controller.update(
        transcript,
        {"participants": [speaker_zero.model_dump()]},
    )

    topic = TranscriptTopic(
        title="Topic 1",
        summary="Summary 1",
        timestamp=0,
        words=[
            Word(text="Hello", start=0, end=1, speaker=0),
            Word(text=" world.", start=1, end=2, speaker=0),
        ],
    )
    await transcripts_controller.upsert_topic(transcript, topic)

    fetched = await client.get(
        f"/transcripts/{transcript_id}?transcript_format=webvtt-named"
    )
    assert fetched.status_code == 200
    payload = fetched.json()

    assert payload["transcript_format"] == "webvtt-named"
    assert "transcript" in payload
    vtt = payload["transcript"]
    assert "WEBVTT" in vtt
    assert "<v John Smith>" in vtt
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_api_transcript_format_json(client):
    """GET /transcripts/{id}?transcript_format=json returns a list of segment objects."""
    created = await client.post("/transcripts", json={"name": "Test transcript"})
    assert created.status_code == 200
    transcript_id = created.json()["id"]

    from reflector.db.transcripts import (
        TranscriptParticipant,
        TranscriptTopic,
        transcripts_controller,
    )
    from reflector.processors.types import Word

    transcript = await transcripts_controller.get_by_id(transcript_id)

    speaker_zero = TranscriptParticipant(id="1", speaker=0, name="John Smith")
    await transcripts_controller.update(
        transcript,
        {"participants": [speaker_zero.model_dump()]},
    )

    topic = TranscriptTopic(
        title="Topic 1",
        summary="Summary 1",
        timestamp=0,
        words=[
            Word(text="Hello", start=0, end=1, speaker=0),
            Word(text=" world.", start=1, end=2, speaker=0),
        ],
    )
    await transcripts_controller.upsert_topic(transcript, topic)

    fetched = await client.get(f"/transcripts/{transcript_id}?transcript_format=json")
    assert fetched.status_code == 200
    payload = fetched.json()

    assert payload["transcript_format"] == "json"
    assert "transcript" in payload
    segments = payload["transcript"]
    assert isinstance(segments, list)
    assert len(segments) == 1
    only_segment = segments[0]
    assert only_segment["speaker"] == 0
    assert only_segment["speaker_name"] == "John Smith"
    assert only_segment["text"] == "Hello world."
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
async def test_api_transcript_format_default_is_text(client):
    """GET /transcripts/{id} without transcript_format falls back to "text"."""
    created = await client.post("/transcripts", json={"name": "Test transcript"})
    assert created.status_code == 200
    transcript_id = created.json()["id"]

    from reflector.db.transcripts import TranscriptTopic, transcripts_controller
    from reflector.processors.types import Word

    transcript = await transcripts_controller.get_by_id(transcript_id)

    topic = TranscriptTopic(
        title="Topic 1",
        summary="Summary 1",
        timestamp=0,
        words=[Word(text="Hello", start=0, end=1, speaker=0)],
    )
    await transcripts_controller.upsert_topic(transcript, topic)

    # No query string: the endpoint has to pick the format itself.
    fetched = await client.get(f"/transcripts/{transcript_id}")
    assert fetched.status_code == 200
    payload = fetched.json()

    assert payload["transcript_format"] == "text"
    assert "transcript" in payload
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
|
||||||
|
async def test_api_topics_endpoint_multitrack_segmentation(client):
|
||||||
|
"""Test GET /transcripts/{id}/topics uses sentence-based segmentation for multitrack.
|
||||||
|
|
||||||
|
This tests the fix for TASKS2.md - ensuring /topics endpoints correctly detect
|
||||||
|
multitrack recordings and use sentence-based segmentation instead of fragmenting
|
||||||
|
on every speaker change.
|
||||||
|
"""
|
||||||
|
from datetime import datetime, timezone
|
||||||
|
|
||||||
|
from reflector.db.recordings import Recording, recordings_controller
|
||||||
|
from reflector.db.transcripts import (
|
||||||
|
TranscriptParticipant,
|
||||||
|
TranscriptTopic,
|
||||||
|
transcripts_controller,
|
||||||
|
)
|
||||||
|
from reflector.processors.types import Word
|
||||||
|
|
||||||
|
# Create a multitrack recording (has track_keys)
|
||||||
|
recording = Recording(
|
||||||
|
bucket_name="test-bucket",
|
||||||
|
object_key="test-key",
|
||||||
|
recorded_at=datetime.now(timezone.utc),
|
||||||
|
track_keys=["track1.webm", "track2.webm"], # This makes it multitrack
|
||||||
|
)
|
||||||
|
await recordings_controller.create(recording)
|
||||||
|
|
||||||
|
# Create transcript linked to the recording
|
||||||
|
transcript = await transcripts_controller.add(
|
||||||
|
name="Multitrack Test",
|
||||||
|
source_kind="file",
|
||||||
|
recording_id=recording.id,
|
||||||
|
)
|
||||||
|
|
||||||
|
await transcripts_controller.update(
|
||||||
|
transcript,
|
||||||
|
{
|
||||||
|
"participants": [
|
||||||
|
TranscriptParticipant(id="1", speaker=0, name="Alice").model_dump(),
|
||||||
|
TranscriptParticipant(id="2", speaker=1, name="Bob").model_dump(),
|
||||||
|
]
|
||||||
|
},
|
||||||
|
)
|
||||||
|
|
||||||
|
# Add interleaved words (as they appear in real multitrack data)
|
||||||
|
await transcripts_controller.upsert_topic(
|
||||||
|
transcript,
|
||||||
|
TranscriptTopic(
|
||||||
|
title="Topic 1",
|
||||||
|
summary="Summary 1",
|
||||||
|
timestamp=0,
|
||||||
|
words=[
|
||||||
|
Word(text="Hello ", start=0.0, end=0.5, speaker=0),
|
||||||
|
Word(text="I'm ", start=0.5, end=0.8, speaker=1),
|
||||||
|
Word(text="there.", start=0.5, end=1.0, speaker=0),
|
||||||
|
Word(text="good.", start=1.0, end=1.5, speaker=1),
|
||||||
|
],
|
||||||
|
),
|
||||||
|
)
|
||||||
|
|
||||||
|
# Test /topics endpoint
|
||||||
|
response = await client.get(f"/transcripts/{transcript.id}/topics")
|
||||||
|
assert response.status_code == 200
|
||||||
|
data = response.json()
|
||||||
|
|
||||||
|
assert len(data) == 1
|
||||||
|
topic = data[0]
|
||||||
|
|
||||||
|
# Key assertion: multitrack should produce 2 segments (one per speaker sentence)
|
||||||
|
# Not 4 segments (one per speaker change)
|
||||||
|
assert len(topic["segments"]) == 2
|
||||||
|
|
||||||
|
# Check content
|
||||||
|
segment_texts = [s["text"] for s in topic["segments"]]
|
||||||
|
assert "Hello there." in segment_texts
|
||||||
|
assert "I'm good." in segment_texts
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
|
||||||
|
async def test_api_topics_endpoint_non_multitrack_segmentation(client):
|
||||||
|
"""Test GET /transcripts/{id}/topics uses default segmentation for non-multitrack.
|
||||||
|
|
||||||
|
Ensures backward compatibility - transcripts without multitrack recordings
|
||||||
|
should continue using the default speaker-change-based segmentation.
|
||||||
|
"""
|
||||||
|
from reflector.db.transcripts import (
|
||||||
|
TranscriptParticipant,
|
||||||
|
TranscriptTopic,
|
||||||
|
transcripts_controller,
|
||||||
|
)
|
||||||
|
from reflector.processors.types import Word
|
||||||
|
|
||||||
|
# Create transcript WITHOUT recording (defaulted as not multitrack) TODO better heuristic
|
||||||
|
response = await client.post("/transcripts", json={"name": "Test transcript"})
|
||||||
|
assert response.status_code == 200
|
||||||
|
tid = response.json()["id"]
|
||||||
|
|
||||||
|
transcript = await transcripts_controller.get_by_id(tid)
|
||||||
|
|
||||||
|
await transcripts_controller.update(
|
||||||
|
transcript,
|
||||||
|
{
|
||||||
|
"participants": [
|
||||||
|
TranscriptParticipant(id="1", speaker=0, name="Alice").model_dump(),
|
||||||
|
TranscriptParticipant(id="2", speaker=1, name="Bob").model_dump(),
|
||||||
|
]
|
||||||
|
},
|
||||||
|
)
|
||||||
|
|
||||||
|
# Add interleaved words
|
||||||
|
await transcripts_controller.upsert_topic(
|
||||||
|
transcript,
|
||||||
|
TranscriptTopic(
|
||||||
|
title="Topic 1",
|
||||||
|
summary="Summary 1",
|
||||||
|
timestamp=0,
|
||||||
|
words=[
|
||||||
|
Word(text="Hello ", start=0.0, end=0.5, speaker=0),
|
||||||
|
Word(text="I'm ", start=0.5, end=0.8, speaker=1),
|
||||||
|
Word(text="there.", start=0.5, end=1.0, speaker=0),
|
||||||
|
Word(text="good.", start=1.0, end=1.5, speaker=1),
|
||||||
|
],
|
||||||
|
),
|
||||||
|
)
|
||||||
|
|
||||||
|
# Test /topics endpoint
|
||||||
|
response = await client.get(f"/transcripts/{tid}/topics")
|
||||||
|
assert response.status_code == 200
|
||||||
|
data = response.json()
|
||||||
|
|
||||||
|
assert len(data) == 1
|
||||||
|
topic = data[0]
|
||||||
|
|
||||||
|
# Non-multitrack: should produce 4 segments (one per speaker change)
|
||||||
|
assert len(topic["segments"]) == 4
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.asyncio
|
||||||
|
async def test_api_topics_with_words_endpoint_multitrack(client):
|
||||||
|
"""Test GET /transcripts/{id}/topics/with-words uses multitrack segmentation."""
|
||||||
|
from datetime import datetime, timezone
|
||||||
|
|
||||||
|
from reflector.db.recordings import Recording, recordings_controller
|
||||||
|
from reflector.db.transcripts import (
|
||||||
|
TranscriptParticipant,
|
||||||
|
TranscriptTopic,
|
||||||
|
transcripts_controller,
|
||||||
|
)
|
||||||
|
from reflector.processors.types import Word
|
||||||
|
|
||||||
|
# Create multitrack recording
|
||||||
|
recording = Recording(
|
||||||
|
bucket_name="test-bucket",
|
||||||
|
object_key="test-key-2",
|
||||||
|
recorded_at=datetime.now(timezone.utc),
|
||||||
|
track_keys=["track1.webm", "track2.webm"],
|
||||||
|
)
|
||||||
|
await recordings_controller.create(recording)
|
||||||
|
|
||||||
|
transcript = await transcripts_controller.add(
|
||||||
|
name="Multitrack Test 2",
|
||||||
|
source_kind="file",
|
||||||
|
recording_id=recording.id,
|
||||||
|
)
|
||||||
|
|
||||||
|
await transcripts_controller.update(
|
||||||
|
transcript,
|
||||||
|
{
|
||||||
|
"participants": [
|
||||||
|
TranscriptParticipant(id="1", speaker=0, name="Alice").model_dump(),
|
||||||
|
TranscriptParticipant(id="2", speaker=1, name="Bob").model_dump(),
|
||||||
|
]
|
||||||
|
},
|
||||||
|
)
|
||||||
|
|
||||||
|
await transcripts_controller.upsert_topic(
|
||||||
|
transcript,
|
||||||
|
TranscriptTopic(
|
||||||
|
title="Topic 1",
|
||||||
|
summary="Summary 1",
|
||||||
|
timestamp=0,
|
||||||
|
words=[
|
||||||
|
Word(text="Hello ", start=0.0, end=0.5, speaker=0),
|
||||||
|
Word(text="I'm ", start=0.5, end=0.8, speaker=1),
|
||||||
|
Word(text="there.", start=0.5, end=1.0, speaker=0),
|
||||||
|
Word(text="good.", start=1.0, end=1.5, speaker=1),
|
||||||
|
],
|
||||||
|
),
|
||||||
|
)
|
||||||
|
|
||||||
|
response = await client.get(f"/transcripts/{transcript.id}/topics/with-words")
|
||||||
|
assert response.status_code == 200
|
||||||
|
data = response.json()
|
||||||
|
|
||||||
|
assert len(data) == 1
|
||||||
|
topic = data[0]
|
||||||
|
|
||||||
|
# Should have 2 segments (multitrack sentence-based)
|
||||||
|
assert len(topic["segments"]) == 2
|
||||||
|
# Should also have words field
|
||||||
|
assert "words" in topic
|
||||||
|
assert len(topic["words"]) == 4
|
||||||
@@ -139,10 +139,10 @@ async def test_whereby_recording_uses_file_pipeline(client):
|
|||||||
|
|
||||||
with (
|
with (
|
||||||
patch(
|
patch(
|
||||||
"reflector.views.transcripts_process.task_pipeline_file_process"
|
"reflector.services.transcript_process.task_pipeline_file_process"
|
||||||
) as mock_file_pipeline,
|
) as mock_file_pipeline,
|
||||||
patch(
|
patch(
|
||||||
"reflector.views.transcripts_process.task_pipeline_multitrack_process"
|
"reflector.services.transcript_process.task_pipeline_multitrack_process"
|
||||||
) as mock_multitrack_pipeline,
|
) as mock_multitrack_pipeline,
|
||||||
):
|
):
|
||||||
response = await client.post(f"/transcripts/{transcript.id}/process")
|
response = await client.post(f"/transcripts/{transcript.id}/process")
|
||||||
@@ -194,10 +194,10 @@ async def test_dailyco_recording_uses_multitrack_pipeline(client):
|
|||||||
|
|
||||||
with (
|
with (
|
||||||
patch(
|
patch(
|
||||||
"reflector.views.transcripts_process.task_pipeline_file_process"
|
"reflector.services.transcript_process.task_pipeline_file_process"
|
||||||
) as mock_file_pipeline,
|
) as mock_file_pipeline,
|
||||||
patch(
|
patch(
|
||||||
"reflector.views.transcripts_process.task_pipeline_multitrack_process"
|
"reflector.services.transcript_process.task_pipeline_multitrack_process"
|
||||||
) as mock_multitrack_pipeline,
|
) as mock_multitrack_pipeline,
|
||||||
):
|
):
|
||||||
response = await client.post(f"/transcripts/{transcript.id}/process")
|
response = await client.post(f"/transcripts/{transcript.id}/process")
|
||||||
|
|||||||
@@ -120,7 +120,15 @@ async def test_user_ws_accepts_valid_token_and_receives_events(appserver_ws_user
|
|||||||
host, port = appserver_ws_user
|
host, port = appserver_ws_user
|
||||||
base_ws = f"http://{host}:{port}/v1/events"
|
base_ws = f"http://{host}:{port}/v1/events"
|
||||||
|
|
||||||
token = _make_dummy_jwt("user-abc")
|
# Create a test user in the database
|
||||||
|
from reflector.db.users import user_controller
|
||||||
|
|
||||||
|
test_uid = "user-abc"
|
||||||
|
user = await user_controller.create_or_update(
|
||||||
|
id="test-user-id-abc", authentik_uid=test_uid, email="user-abc@example.com"
|
||||||
|
)
|
||||||
|
|
||||||
|
token = _make_dummy_jwt(test_uid)
|
||||||
subprotocols = ["bearer", token]
|
subprotocols = ["bearer", token]
|
||||||
|
|
||||||
# Connect and then trigger an event via HTTP create
|
# Connect and then trigger an event via HTTP create
|
||||||
@@ -132,12 +140,13 @@ async def test_user_ws_accepts_valid_token_and_receives_events(appserver_ws_user
|
|||||||
from reflector.auth import current_user, current_user_optional
|
from reflector.auth import current_user, current_user_optional
|
||||||
|
|
||||||
# Override auth dependencies so HTTP request is performed as the same user
|
# Override auth dependencies so HTTP request is performed as the same user
|
||||||
|
# Use the internal user.id (not the Authentik UID)
|
||||||
app.dependency_overrides[current_user] = lambda: {
|
app.dependency_overrides[current_user] = lambda: {
|
||||||
"sub": "user-abc",
|
"sub": user.id,
|
||||||
"email": "user-abc@example.com",
|
"email": "user-abc@example.com",
|
||||||
}
|
}
|
||||||
app.dependency_overrides[current_user_optional] = lambda: {
|
app.dependency_overrides[current_user_optional] = lambda: {
|
||||||
"sub": "user-abc",
|
"sub": user.id,
|
||||||
"email": "user-abc@example.com",
|
"email": "user-abc@example.com",
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|||||||
@@ -22,9 +22,10 @@ AUTHENTIK_CLIENT_SECRET=your-client-secret-here
|
|||||||
|
|
||||||
# API URLs
|
# API URLs
|
||||||
API_URL=http://127.0.0.1:1250
|
API_URL=http://127.0.0.1:1250
|
||||||
|
SERVER_API_URL=http://server:1250
|
||||||
WEBSOCKET_URL=ws://127.0.0.1:1250
|
WEBSOCKET_URL=ws://127.0.0.1:1250
|
||||||
AUTH_CALLBACK_URL=http://localhost:3000/auth-callback
|
AUTH_CALLBACK_URL=http://localhost:3000/auth-callback
|
||||||
|
|
||||||
# Sentry
|
# Sentry
|
||||||
# SENTRY_DSN=https://your-dsn@sentry.io/project-id
|
# SENTRY_DSN=https://your-dsn@sentry.io/project-id
|
||||||
# SENTRY_IGNORE_API_RESOLUTION_ERROR=1
|
# SENTRY_IGNORE_API_RESOLUTION_ERROR=1
|
||||||
|
|||||||
@@ -67,6 +67,11 @@ const recordingTypeOptions: SelectOption[] = [
|
|||||||
{ label: "Cloud", value: "cloud" },
|
{ label: "Cloud", value: "cloud" },
|
||||||
];
|
];
|
||||||
|
|
||||||
|
const platformOptions: SelectOption[] = [
|
||||||
|
{ label: "Whereby", value: "whereby" },
|
||||||
|
{ label: "Daily", value: "daily" },
|
||||||
|
];
|
||||||
|
|
||||||
const roomInitialState = {
|
const roomInitialState = {
|
||||||
name: "",
|
name: "",
|
||||||
zulipAutoPost: false,
|
zulipAutoPost: false,
|
||||||
@@ -82,6 +87,7 @@ const roomInitialState = {
|
|||||||
icsUrl: "",
|
icsUrl: "",
|
||||||
icsEnabled: false,
|
icsEnabled: false,
|
||||||
icsFetchInterval: 5,
|
icsFetchInterval: 5,
|
||||||
|
platform: "whereby",
|
||||||
};
|
};
|
||||||
|
|
||||||
export default function RoomsList() {
|
export default function RoomsList() {
|
||||||
@@ -99,6 +105,11 @@ export default function RoomsList() {
|
|||||||
const recordingTypeCollection = createListCollection({
|
const recordingTypeCollection = createListCollection({
|
||||||
items: recordingTypeOptions,
|
items: recordingTypeOptions,
|
||||||
});
|
});
|
||||||
|
|
||||||
|
const platformCollection = createListCollection({
|
||||||
|
items: platformOptions,
|
||||||
|
});
|
||||||
|
|
||||||
const [roomInput, setRoomInput] = useState<null | typeof roomInitialState>(
|
const [roomInput, setRoomInput] = useState<null | typeof roomInitialState>(
|
||||||
null,
|
null,
|
||||||
);
|
);
|
||||||
@@ -143,15 +154,24 @@ export default function RoomsList() {
|
|||||||
zulipStream: detailedEditedRoom.zulip_stream,
|
zulipStream: detailedEditedRoom.zulip_stream,
|
||||||
zulipTopic: detailedEditedRoom.zulip_topic,
|
zulipTopic: detailedEditedRoom.zulip_topic,
|
||||||
isLocked: detailedEditedRoom.is_locked,
|
isLocked: detailedEditedRoom.is_locked,
|
||||||
roomMode: detailedEditedRoom.room_mode,
|
roomMode:
|
||||||
|
detailedEditedRoom.platform === "daily"
|
||||||
|
? "group"
|
||||||
|
: detailedEditedRoom.room_mode,
|
||||||
recordingType: detailedEditedRoom.recording_type,
|
recordingType: detailedEditedRoom.recording_type,
|
||||||
recordingTrigger: detailedEditedRoom.recording_trigger,
|
recordingTrigger:
|
||||||
|
detailedEditedRoom.platform === "daily"
|
||||||
|
? detailedEditedRoom.recording_type === "cloud"
|
||||||
|
? "automatic-2nd-participant"
|
||||||
|
: "none"
|
||||||
|
: detailedEditedRoom.recording_trigger,
|
||||||
isShared: detailedEditedRoom.is_shared,
|
isShared: detailedEditedRoom.is_shared,
|
||||||
webhookUrl: detailedEditedRoom.webhook_url || "",
|
webhookUrl: detailedEditedRoom.webhook_url || "",
|
||||||
webhookSecret: detailedEditedRoom.webhook_secret || "",
|
webhookSecret: detailedEditedRoom.webhook_secret || "",
|
||||||
icsUrl: detailedEditedRoom.ics_url || "",
|
icsUrl: detailedEditedRoom.ics_url || "",
|
||||||
icsEnabled: detailedEditedRoom.ics_enabled || false,
|
icsEnabled: detailedEditedRoom.ics_enabled || false,
|
||||||
icsFetchInterval: detailedEditedRoom.ics_fetch_interval || 5,
|
icsFetchInterval: detailedEditedRoom.ics_fetch_interval || 5,
|
||||||
|
platform: detailedEditedRoom.platform,
|
||||||
}
|
}
|
||||||
: null,
|
: null,
|
||||||
[detailedEditedRoom],
|
[detailedEditedRoom],
|
||||||
@@ -277,21 +297,32 @@ export default function RoomsList() {
|
|||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
const platform: "whereby" | "daily" | null =
|
||||||
|
room.platform === "whereby" || room.platform === "daily"
|
||||||
|
? room.platform
|
||||||
|
: null;
|
||||||
|
|
||||||
const roomData = {
|
const roomData = {
|
||||||
name: room.name,
|
name: room.name,
|
||||||
zulip_auto_post: room.zulipAutoPost,
|
zulip_auto_post: room.zulipAutoPost,
|
||||||
zulip_stream: room.zulipStream,
|
zulip_stream: room.zulipStream,
|
||||||
zulip_topic: room.zulipTopic,
|
zulip_topic: room.zulipTopic,
|
||||||
is_locked: room.isLocked,
|
is_locked: room.isLocked,
|
||||||
room_mode: room.roomMode,
|
room_mode: platform === "daily" ? "group" : room.roomMode,
|
||||||
recording_type: room.recordingType,
|
recording_type: room.recordingType,
|
||||||
recording_trigger: room.recordingTrigger,
|
recording_trigger:
|
||||||
|
platform === "daily"
|
||||||
|
? room.recordingType === "cloud"
|
||||||
|
? "automatic-2nd-participant"
|
||||||
|
: "none"
|
||||||
|
: room.recordingTrigger,
|
||||||
is_shared: room.isShared,
|
is_shared: room.isShared,
|
||||||
webhook_url: room.webhookUrl,
|
webhook_url: room.webhookUrl,
|
||||||
webhook_secret: room.webhookSecret,
|
webhook_secret: room.webhookSecret,
|
||||||
ics_url: room.icsUrl,
|
ics_url: room.icsUrl,
|
||||||
ics_enabled: room.icsEnabled,
|
ics_enabled: room.icsEnabled,
|
||||||
ics_fetch_interval: room.icsFetchInterval,
|
ics_fetch_interval: room.icsFetchInterval,
|
||||||
|
platform,
|
||||||
};
|
};
|
||||||
|
|
||||||
if (isEditing) {
|
if (isEditing) {
|
||||||
@@ -339,15 +370,21 @@ export default function RoomsList() {
|
|||||||
zulipStream: roomData.zulip_stream,
|
zulipStream: roomData.zulip_stream,
|
||||||
zulipTopic: roomData.zulip_topic,
|
zulipTopic: roomData.zulip_topic,
|
||||||
isLocked: roomData.is_locked,
|
isLocked: roomData.is_locked,
|
||||||
roomMode: roomData.room_mode,
|
roomMode: roomData.platform === "daily" ? "group" : roomData.room_mode, // Daily always uses 2-200
|
||||||
recordingType: roomData.recording_type,
|
recordingType: roomData.recording_type,
|
||||||
recordingTrigger: roomData.recording_trigger,
|
recordingTrigger:
|
||||||
|
roomData.platform === "daily"
|
||||||
|
? roomData.recording_type === "cloud"
|
||||||
|
? "automatic-2nd-participant"
|
||||||
|
: "none"
|
||||||
|
: roomData.recording_trigger,
|
||||||
isShared: roomData.is_shared,
|
isShared: roomData.is_shared,
|
||||||
webhookUrl: roomData.webhook_url || "",
|
webhookUrl: roomData.webhook_url || "",
|
||||||
webhookSecret: roomData.webhook_secret || "",
|
webhookSecret: roomData.webhook_secret || "",
|
||||||
icsUrl: roomData.ics_url || "",
|
icsUrl: roomData.ics_url || "",
|
||||||
icsEnabled: roomData.ics_enabled || false,
|
icsEnabled: roomData.ics_enabled || false,
|
||||||
icsFetchInterval: roomData.ics_fetch_interval || 5,
|
icsFetchInterval: roomData.ics_fetch_interval || 5,
|
||||||
|
platform: roomData.platform,
|
||||||
});
|
});
|
||||||
setEditRoomId(roomId);
|
setEditRoomId(roomId);
|
||||||
setIsEditing(true);
|
setIsEditing(true);
|
||||||
@@ -482,6 +519,48 @@ export default function RoomsList() {
|
|||||||
)}
|
)}
|
||||||
</Field.Root>
|
</Field.Root>
|
||||||
|
|
||||||
|
<Field.Root mt={4}>
|
||||||
|
<Field.Label>Platform</Field.Label>
|
||||||
|
<Select.Root
|
||||||
|
value={[room.platform]}
|
||||||
|
onValueChange={(e) => {
|
||||||
|
const newPlatform = e.value[0] as "whereby" | "daily";
|
||||||
|
const updates: Partial<typeof room> = {
|
||||||
|
platform: newPlatform,
|
||||||
|
};
|
||||||
|
if (newPlatform === "daily") {
|
||||||
|
updates.roomMode = "group";
|
||||||
|
updates.recordingTrigger =
|
||||||
|
room.recordingType === "cloud"
|
||||||
|
? "automatic-2nd-participant"
|
||||||
|
: "none";
|
||||||
|
}
|
||||||
|
setRoomInput({ ...room, ...updates });
|
||||||
|
}}
|
||||||
|
collection={platformCollection}
|
||||||
|
>
|
||||||
|
<Select.HiddenSelect />
|
||||||
|
<Select.Control>
|
||||||
|
<Select.Trigger>
|
||||||
|
<Select.ValueText placeholder="Select platform" />
|
||||||
|
</Select.Trigger>
|
||||||
|
<Select.IndicatorGroup>
|
||||||
|
<Select.Indicator />
|
||||||
|
</Select.IndicatorGroup>
|
||||||
|
</Select.Control>
|
||||||
|
<Select.Positioner>
|
||||||
|
<Select.Content>
|
||||||
|
{platformOptions.map((option) => (
|
||||||
|
<Select.Item key={option.value} item={option}>
|
||||||
|
{option.label}
|
||||||
|
<Select.ItemIndicator />
|
||||||
|
</Select.Item>
|
||||||
|
))}
|
||||||
|
</Select.Content>
|
||||||
|
</Select.Positioner>
|
||||||
|
</Select.Root>
|
||||||
|
</Field.Root>
|
||||||
|
|
||||||
<Field.Root mt={4}>
|
<Field.Root mt={4}>
|
||||||
<Checkbox.Root
|
<Checkbox.Root
|
||||||
name="isLocked"
|
name="isLocked"
|
||||||
@@ -512,6 +591,7 @@ export default function RoomsList() {
|
|||||||
setRoomInput({ ...room, roomMode: e.value[0] })
|
setRoomInput({ ...room, roomMode: e.value[0] })
|
||||||
}
|
}
|
||||||
collection={roomModeCollection}
|
collection={roomModeCollection}
|
||||||
|
disabled={room.platform === "daily"}
|
||||||
>
|
>
|
||||||
<Select.HiddenSelect />
|
<Select.HiddenSelect />
|
||||||
<Select.Control>
|
<Select.Control>
|
||||||
@@ -538,16 +618,26 @@ export default function RoomsList() {
|
|||||||
<Field.Label>Recording type</Field.Label>
|
<Field.Label>Recording type</Field.Label>
|
||||||
<Select.Root
|
<Select.Root
|
||||||
value={[room.recordingType]}
|
value={[room.recordingType]}
|
||||||
onValueChange={(e) =>
|
onValueChange={(e) => {
|
||||||
setRoomInput({
|
const newRecordingType = e.value[0];
|
||||||
...room,
|
const updates: Partial<typeof room> = {
|
||||||
recordingType: e.value[0],
|
recordingType: newRecordingType,
|
||||||
recordingTrigger:
|
};
|
||||||
e.value[0] !== "cloud"
|
// For Daily: if cloud, use automatic; otherwise none
|
||||||
|
if (room.platform === "daily") {
|
||||||
|
updates.recordingTrigger =
|
||||||
|
newRecordingType === "cloud"
|
||||||
|
? "automatic-2nd-participant"
|
||||||
|
: "none";
|
||||||
|
} else {
|
||||||
|
// For Whereby: if not cloud, set to none
|
||||||
|
updates.recordingTrigger =
|
||||||
|
newRecordingType !== "cloud"
|
||||||
? "none"
|
? "none"
|
||||||
: room.recordingTrigger,
|
: room.recordingTrigger;
|
||||||
})
|
}
|
||||||
}
|
setRoomInput({ ...room, ...updates });
|
||||||
|
}}
|
||||||
collection={recordingTypeCollection}
|
collection={recordingTypeCollection}
|
||||||
>
|
>
|
||||||
<Select.HiddenSelect />
|
<Select.HiddenSelect />
|
||||||
@@ -572,7 +662,7 @@ export default function RoomsList() {
|
|||||||
</Select.Root>
|
</Select.Root>
|
||||||
</Field.Root>
|
</Field.Root>
|
||||||
<Field.Root mt={4}>
|
<Field.Root mt={4}>
|
||||||
<Field.Label>Cloud recording start trigger</Field.Label>
|
<Field.Label>Recording start trigger</Field.Label>
|
||||||
<Select.Root
|
<Select.Root
|
||||||
value={[room.recordingTrigger]}
|
value={[room.recordingTrigger]}
|
||||||
onValueChange={(e) =>
|
onValueChange={(e) =>
|
||||||
@@ -582,7 +672,11 @@ export default function RoomsList() {
|
|||||||
})
|
})
|
||||||
}
|
}
|
||||||
collection={recordingTriggerCollection}
|
collection={recordingTriggerCollection}
|
||||||
disabled={room.recordingType !== "cloud"}
|
disabled={
|
||||||
|
room.recordingType !== "cloud" ||
|
||||||
|
(room.platform === "daily" &&
|
||||||
|
room.recordingType === "cloud")
|
||||||
|
}
|
||||||
>
|
>
|
||||||
<Select.HiddenSelect />
|
<Select.HiddenSelect />
|
||||||
<Select.Control>
|
<Select.Control>
|
||||||
|
|||||||
@@ -117,15 +117,6 @@ export default function TranscriptDetails(details: TranscriptDetails) {
|
|||||||
return <Modal title="Loading" text={"Loading transcript..."} />;
|
return <Modal title="Loading" text={"Loading transcript..."} />;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (mp3.error) {
|
|
||||||
return (
|
|
||||||
<Modal
|
|
||||||
title="Transcription error"
|
|
||||||
text={`There was an error loading the recording. Error: ${mp3.error}`}
|
|
||||||
/>
|
|
||||||
);
|
|
||||||
}
|
|
||||||
|
|
||||||
return (
|
return (
|
||||||
<>
|
<>
|
||||||
<Grid
|
<Grid
|
||||||
@@ -147,7 +138,12 @@ export default function TranscriptDetails(details: TranscriptDetails) {
|
|||||||
/>
|
/>
|
||||||
) : !mp3.loading && (waveform.error || mp3.error) ? (
|
) : !mp3.loading && (waveform.error || mp3.error) ? (
|
||||||
<Box p={4} bg="red.100" borderRadius="md">
|
<Box p={4} bg="red.100" borderRadius="md">
|
||||||
<Text>Error loading this recording</Text>
|
<Text>
|
||||||
|
Error loading{" "}
|
||||||
|
{[waveform.error && "waveform", mp3.error && "mp3"]
|
||||||
|
.filter(Boolean)
|
||||||
|
.join(" and ")}
|
||||||
|
</Text>
|
||||||
</Box>
|
</Box>
|
||||||
) : (
|
) : (
|
||||||
<Skeleton h={14} />
|
<Skeleton h={14} />
|
||||||
|
|||||||
@@ -1,14 +1,16 @@
|
|||||||
import { useState } from "react";
|
import { useState } from "react";
|
||||||
import type { components } from "../../reflector-api";
|
import type { components, operations } from "../../reflector-api";
|
||||||
type GetTranscript = components["schemas"]["GetTranscript"];
|
type GetTranscriptWithParticipants =
|
||||||
|
components["schemas"]["GetTranscriptWithParticipants"];
|
||||||
type GetTranscriptTopic = components["schemas"]["GetTranscriptTopic"];
|
type GetTranscriptTopic = components["schemas"]["GetTranscriptTopic"];
|
||||||
import { Button, BoxProps, Box } from "@chakra-ui/react";
|
import { Button, BoxProps, Box, Menu, Text } from "@chakra-ui/react";
|
||||||
import { buildTranscriptWithTopics } from "./buildTranscriptWithTopics";
|
import { LuChevronDown } from "react-icons/lu";
|
||||||
import { useTranscriptParticipants } from "../../lib/apiHooks";
|
import { client } from "../../lib/apiClient";
|
||||||
|
import { toaster } from "../../components/ui/toaster";
|
||||||
|
|
||||||
type ShareCopyProps = {
|
type ShareCopyProps = {
|
||||||
finalSummaryElement: HTMLDivElement | null;
|
finalSummaryElement: HTMLDivElement | null;
|
||||||
transcript: GetTranscript;
|
transcript: GetTranscriptWithParticipants;
|
||||||
topics: GetTranscriptTopic[];
|
topics: GetTranscriptTopic[];
|
||||||
};
|
};
|
||||||
|
|
||||||
@@ -20,11 +22,33 @@ export default function ShareCopy({
|
|||||||
}: ShareCopyProps & BoxProps) {
|
}: ShareCopyProps & BoxProps) {
|
||||||
const [isCopiedSummary, setIsCopiedSummary] = useState(false);
|
const [isCopiedSummary, setIsCopiedSummary] = useState(false);
|
||||||
const [isCopiedTranscript, setIsCopiedTranscript] = useState(false);
|
const [isCopiedTranscript, setIsCopiedTranscript] = useState(false);
|
||||||
const participantsQuery = useTranscriptParticipants(transcript?.id || null);
|
const [isCopying, setIsCopying] = useState(false);
|
||||||
|
|
||||||
|
type ApiTranscriptFormat = NonNullable<
|
||||||
|
operations["v1_transcript_get"]["parameters"]["query"]
|
||||||
|
>["transcript_format"];
|
||||||
|
const TRANSCRIPT_FORMATS = [
|
||||||
|
"text",
|
||||||
|
"text-timestamped",
|
||||||
|
"webvtt-named",
|
||||||
|
"json",
|
||||||
|
] as const satisfies ApiTranscriptFormat[];
|
||||||
|
type TranscriptFormat = (typeof TRANSCRIPT_FORMATS)[number];
|
||||||
|
|
||||||
|
const TRANSCRIPT_FORMAT_LABELS: { [k in TranscriptFormat]: string } = {
|
||||||
|
text: "Plain text",
|
||||||
|
"text-timestamped": "Text + timestamps",
|
||||||
|
"webvtt-named": "WebVTT (named)",
|
||||||
|
json: "JSON",
|
||||||
|
};
|
||||||
|
|
||||||
|
const formatOptions = TRANSCRIPT_FORMATS.map((f) => ({
|
||||||
|
value: f,
|
||||||
|
label: TRANSCRIPT_FORMAT_LABELS[f],
|
||||||
|
}));
|
||||||
|
|
||||||
const onCopySummaryClick = () => {
|
const onCopySummaryClick = () => {
|
||||||
const text_to_copy = finalSummaryElement?.innerText;
|
const text_to_copy = finalSummaryElement?.innerText;
|
||||||
|
|
||||||
if (text_to_copy) {
|
if (text_to_copy) {
|
||||||
navigator.clipboard.writeText(text_to_copy).then(() => {
|
navigator.clipboard.writeText(text_to_copy).then(() => {
|
||||||
setIsCopiedSummary(true);
|
setIsCopiedSummary(true);
|
||||||
@@ -34,27 +58,91 @@ export default function ShareCopy({
|
|||||||
}
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
const onCopyTranscriptClick = () => {
|
const onCopyTranscriptFormatClick = async (format: TranscriptFormat) => {
|
||||||
const text_to_copy =
|
try {
|
||||||
buildTranscriptWithTopics(
|
setIsCopying(true);
|
||||||
topics || [],
|
const { data, error } = await client.GET(
|
||||||
participantsQuery?.data || null,
|
"/v1/transcripts/{transcript_id}",
|
||||||
transcript?.title || null,
|
{
|
||||||
) || "";
|
params: {
|
||||||
|
path: { transcript_id: transcript.id },
|
||||||
|
query: { transcript_format: format },
|
||||||
|
},
|
||||||
|
},
|
||||||
|
);
|
||||||
|
if (error) {
|
||||||
|
console.error("Failed to copy transcript:", error);
|
||||||
|
toaster.create({
|
||||||
|
duration: 3000,
|
||||||
|
render: () => (
|
||||||
|
<Box bg="red.500" color="white" px={4} py={3} borderRadius="md">
|
||||||
|
<Text fontWeight="bold">Error</Text>
|
||||||
|
<Text fontSize="sm">Failed to fetch transcript</Text>
|
||||||
|
</Box>
|
||||||
|
),
|
||||||
|
});
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
text_to_copy &&
|
const copiedText =
|
||||||
navigator.clipboard.writeText(text_to_copy).then(() => {
|
format === "json"
|
||||||
|
? JSON.stringify(data?.transcript ?? {}, null, 2)
|
||||||
|
: String(data?.transcript ?? "");
|
||||||
|
|
||||||
|
if (copiedText) {
|
||||||
|
await navigator.clipboard.writeText(copiedText);
|
||||||
setIsCopiedTranscript(true);
|
setIsCopiedTranscript(true);
|
||||||
// Reset the copied state after 2 seconds
|
|
||||||
setTimeout(() => setIsCopiedTranscript(false), 2000);
|
setTimeout(() => setIsCopiedTranscript(false), 2000);
|
||||||
|
}
|
||||||
|
} catch (e) {
|
||||||
|
console.error("Failed to copy transcript:", e);
|
||||||
|
toaster.create({
|
||||||
|
duration: 3000,
|
||||||
|
render: () => (
|
||||||
|
<Box bg="red.500" color="white" px={4} py={3} borderRadius="md">
|
||||||
|
<Text fontWeight="bold">Error</Text>
|
||||||
|
<Text fontSize="sm">Failed to copy transcript</Text>
|
||||||
|
</Box>
|
||||||
|
),
|
||||||
});
|
});
|
||||||
|
} finally {
|
||||||
|
setIsCopying(false);
|
||||||
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
return (
|
return (
|
||||||
<Box {...boxProps}>
|
<Box {...boxProps}>
|
||||||
<Button onClick={onCopyTranscriptClick} mr={2} variant="subtle">
|
<Menu.Root
|
||||||
{isCopiedTranscript ? "Copied!" : "Copy Transcript"}
|
closeOnSelect={true}
|
||||||
</Button>
|
lazyMount={true}
|
||||||
|
positioning={{ gutter: 4 }}
|
||||||
|
>
|
||||||
|
<Menu.Trigger asChild>
|
||||||
|
<Button
|
||||||
|
mr={2}
|
||||||
|
variant="subtle"
|
||||||
|
loading={isCopying}
|
||||||
|
loadingText="Copying..."
|
||||||
|
>
|
||||||
|
{isCopiedTranscript ? "Copied!" : "Copy Transcript"}
|
||||||
|
<LuChevronDown style={{ marginLeft: 6 }} />
|
||||||
|
</Button>
|
||||||
|
</Menu.Trigger>
|
||||||
|
<Menu.Positioner>
|
||||||
|
<Menu.Content>
|
||||||
|
{formatOptions.map((opt) => (
|
||||||
|
<Menu.Item
|
||||||
|
key={opt.value}
|
||||||
|
value={opt.value}
|
||||||
|
_hover={{ backgroundColor: "gray.100" }}
|
||||||
|
onClick={() => onCopyTranscriptFormatClick(opt.value)}
|
||||||
|
>
|
||||||
|
{opt.label}
|
||||||
|
</Menu.Item>
|
||||||
|
))}
|
||||||
|
</Menu.Content>
|
||||||
|
</Menu.Positioner>
|
||||||
|
</Menu.Root>
|
||||||
<Button onClick={onCopySummaryClick} variant="subtle">
|
<Button onClick={onCopySummaryClick} variant="subtle">
|
||||||
{isCopiedSummary ? "Copied!" : "Copy Summary"}
|
{isCopiedSummary ? "Copied!" : "Copy Summary"}
|
||||||
</Button>
|
</Button>
|
||||||
|
|||||||
@@ -1,8 +1,8 @@
|
|||||||
"use client";
|
"use client";
|
||||||
|
|
||||||
import { useCallback, useEffect, useRef } from "react";
|
import { useCallback, useEffect, useRef, useState } from "react";
|
||||||
import { Box } from "@chakra-ui/react";
|
import { Box, Spinner, Center, Text } from "@chakra-ui/react";
|
||||||
import { useRouter } from "next/navigation";
|
import { useRouter, useParams } from "next/navigation";
|
||||||
import DailyIframe, { DailyCall } from "@daily-co/daily-js";
|
import DailyIframe, { DailyCall } from "@daily-co/daily-js";
|
||||||
import type { components } from "../../reflector-api";
|
import type { components } from "../../reflector-api";
|
||||||
import { useAuth } from "../../lib/AuthProvider";
|
import { useAuth } from "../../lib/AuthProvider";
|
||||||
@@ -10,6 +10,8 @@ import {
|
|||||||
ConsentDialogButton,
|
ConsentDialogButton,
|
||||||
recordingTypeRequiresConsent,
|
recordingTypeRequiresConsent,
|
||||||
} from "../../lib/consent";
|
} from "../../lib/consent";
|
||||||
|
import { useRoomJoinMeeting } from "../../lib/apiHooks";
|
||||||
|
import { assertExists } from "../../lib/utils";
|
||||||
|
|
||||||
type Meeting = components["schemas"]["Meeting"];
|
type Meeting = components["schemas"]["Meeting"];
|
||||||
|
|
||||||
@@ -19,20 +21,46 @@ interface DailyRoomProps {
|
|||||||
|
|
||||||
export default function DailyRoom({ meeting }: DailyRoomProps) {
|
export default function DailyRoom({ meeting }: DailyRoomProps) {
|
||||||
const router = useRouter();
|
const router = useRouter();
|
||||||
|
const params = useParams();
|
||||||
const auth = useAuth();
|
const auth = useAuth();
|
||||||
const status = auth.status;
|
const authLastUserId = auth.lastUserId;
|
||||||
const containerRef = useRef<HTMLDivElement>(null);
|
const containerRef = useRef<HTMLDivElement>(null);
|
||||||
|
const joinMutation = useRoomJoinMeeting();
|
||||||
|
const [joinedMeeting, setJoinedMeeting] = useState<Meeting | null>(null);
|
||||||
|
|
||||||
const roomUrl = meeting?.host_room_url || meeting?.room_url;
|
const roomName = params?.roomName as string;
|
||||||
|
|
||||||
const isLoading = status === "loading";
|
useEffect(() => {
|
||||||
|
if (authLastUserId === undefined || !meeting?.id || !roomName) return;
|
||||||
|
|
||||||
|
const join = async () => {
|
||||||
|
try {
|
||||||
|
const result = await joinMutation.mutateAsync({
|
||||||
|
params: {
|
||||||
|
path: {
|
||||||
|
room_name: roomName,
|
||||||
|
meeting_id: meeting.id,
|
||||||
|
},
|
||||||
|
},
|
||||||
|
});
|
||||||
|
setJoinedMeeting(result);
|
||||||
|
} catch (error) {
|
||||||
|
console.error("Failed to join meeting:", error);
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
|
join();
|
||||||
|
}, [meeting?.id, roomName, authLastUserId]);
|
||||||
|
|
||||||
|
const roomUrl = joinedMeeting?.room_url;
|
||||||
|
|
||||||
const handleLeave = useCallback(() => {
|
const handleLeave = useCallback(() => {
|
||||||
router.push("/browse");
|
router.push("/browse");
|
||||||
}, [router]);
|
}, [router]);
|
||||||
|
|
||||||
useEffect(() => {
|
useEffect(() => {
|
||||||
if (isLoading || !roomUrl || !containerRef.current) return;
|
if (authLastUserId === undefined || !roomUrl || !containerRef.current)
|
||||||
|
return;
|
||||||
|
|
||||||
let frame: DailyCall | null = null;
|
let frame: DailyCall | null = null;
|
||||||
let destroyed = false;
|
let destroyed = false;
|
||||||
@@ -63,7 +91,15 @@ export default function DailyRoom({ meeting }: DailyRoomProps) {
|
|||||||
|
|
||||||
frame.on("joined-meeting", async () => {
|
frame.on("joined-meeting", async () => {
|
||||||
try {
|
try {
|
||||||
await frame.startRecording({ type: "raw-tracks" });
|
const frameInstance = assertExists(
|
||||||
|
frame,
|
||||||
|
"frame object got lost somewhere after frame.on was called",
|
||||||
|
);
|
||||||
|
|
||||||
|
if (meeting.recording_type === "cloud") {
|
||||||
|
console.log("Starting cloud recording");
|
||||||
|
await frameInstance.startRecording({ type: "raw-tracks" });
|
||||||
|
}
|
||||||
} catch (error) {
|
} catch (error) {
|
||||||
console.error("Failed to start recording:", error);
|
console.error("Failed to start recording:", error);
|
||||||
}
|
}
|
||||||
@@ -75,7 +111,9 @@ export default function DailyRoom({ meeting }: DailyRoomProps) {
|
|||||||
}
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
createAndJoin();
|
createAndJoin().catch((error) => {
|
||||||
|
console.error("Failed to create and join meeting:", error);
|
||||||
|
});
|
||||||
|
|
||||||
return () => {
|
return () => {
|
||||||
destroyed = true;
|
destroyed = true;
|
||||||
@@ -85,7 +123,23 @@ export default function DailyRoom({ meeting }: DailyRoomProps) {
|
|||||||
});
|
});
|
||||||
}
|
}
|
||||||
};
|
};
|
||||||
}, [roomUrl, isLoading, handleLeave]);
|
}, [roomUrl, authLastUserId, handleLeave]);
|
||||||
|
|
||||||
|
if (authLastUserId === undefined) {
|
||||||
|
return (
|
||||||
|
<Center width="100vw" height="100vh">
|
||||||
|
<Spinner size="xl" />
|
||||||
|
</Center>
|
||||||
|
);
|
||||||
|
}
|
||||||
|
|
||||||
|
if (joinMutation.isError) {
|
||||||
|
return (
|
||||||
|
<Center width="100vw" height="100vh">
|
||||||
|
<Text color="red.500">Failed to join meeting. Please try again.</Text>
|
||||||
|
</Center>
|
||||||
|
);
|
||||||
|
}
|
||||||
|
|
||||||
if (!roomUrl) {
|
if (!roomUrl) {
|
||||||
return null;
|
return null;
|
||||||
|
|||||||
@@ -1,6 +1,6 @@
|
|||||||
"use client";
|
"use client";
|
||||||
|
|
||||||
import { createContext, useContext } from "react";
|
import { createContext, useContext, useRef } from "react";
|
||||||
import { useSession as useNextAuthSession } from "next-auth/react";
|
import { useSession as useNextAuthSession } from "next-auth/react";
|
||||||
import { signOut, signIn } from "next-auth/react";
|
import { signOut, signIn } from "next-auth/react";
|
||||||
import { configureApiAuth } from "./apiClient";
|
import { configureApiAuth } from "./apiClient";
|
||||||
@@ -25,6 +25,9 @@ type AuthContextType = (
|
|||||||
update: () => Promise<Session | null>;
|
update: () => Promise<Session | null>;
|
||||||
signIn: typeof signIn;
|
signIn: typeof signIn;
|
||||||
signOut: typeof signOut;
|
signOut: typeof signOut;
|
||||||
|
// TODO probably rename isLoading to isReloading and make THIS field "isLoading"
|
||||||
|
// undefined is "not known", null is "is certainly logged out"
|
||||||
|
lastUserId: CustomSession["user"]["id"] | null | undefined;
|
||||||
};
|
};
|
||||||
|
|
||||||
const AuthContext = createContext<AuthContextType | undefined>(undefined);
|
const AuthContext = createContext<AuthContextType | undefined>(undefined);
|
||||||
@@ -41,10 +44,15 @@ const noopAuthContext: AuthContextType = {
|
|||||||
signOut: async () => {
|
signOut: async () => {
|
||||||
throw new Error("signOut not supposed to be called");
|
throw new Error("signOut not supposed to be called");
|
||||||
},
|
},
|
||||||
|
lastUserId: undefined,
|
||||||
};
|
};
|
||||||
|
|
||||||
export function AuthProvider({ children }: { children: React.ReactNode }) {
|
export function AuthProvider({ children }: { children: React.ReactNode }) {
|
||||||
const { data: session, status, update } = useNextAuthSession();
|
const { data: session, status, update } = useNextAuthSession();
|
||||||
|
// referential comparison done in component, must be primitive /or cached
|
||||||
|
const lastUserId = useRef<CustomSession["user"]["id"] | null | undefined>(
|
||||||
|
null,
|
||||||
|
);
|
||||||
|
|
||||||
const contextValue: AuthContextType = isAuthEnabled
|
const contextValue: AuthContextType = isAuthEnabled
|
||||||
? {
|
? {
|
||||||
@@ -73,11 +81,16 @@ export function AuthProvider({ children }: { children: React.ReactNode }) {
|
|||||||
case "authenticated": {
|
case "authenticated": {
|
||||||
const customSession = assertCustomSession(session);
|
const customSession = assertCustomSession(session);
|
||||||
if (customSession?.error === REFRESH_ACCESS_TOKEN_ERROR) {
|
if (customSession?.error === REFRESH_ACCESS_TOKEN_ERROR) {
|
||||||
|
// warning: call order-dependent
|
||||||
|
lastUserId.current = null;
|
||||||
// token had expired but next auth still returns "authenticated" so show user unauthenticated state
|
// token had expired but next auth still returns "authenticated" so show user unauthenticated state
|
||||||
return {
|
return {
|
||||||
status: "unauthenticated" as const,
|
status: "unauthenticated" as const,
|
||||||
};
|
};
|
||||||
} else if (customSession?.accessToken) {
|
} else if (customSession?.accessToken) {
|
||||||
|
// updates anyways with updated properties below
|
||||||
|
// warning! execution order conscience, must be ran before reading lastUserId.current below
|
||||||
|
lastUserId.current = customSession.user.id;
|
||||||
return {
|
return {
|
||||||
status,
|
status,
|
||||||
accessToken: customSession.accessToken,
|
accessToken: customSession.accessToken,
|
||||||
@@ -92,6 +105,8 @@ export function AuthProvider({ children }: { children: React.ReactNode }) {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
case "unauthenticated": {
|
case "unauthenticated": {
|
||||||
|
// warning: call order-dependent
|
||||||
|
lastUserId.current = null;
|
||||||
return { status: "unauthenticated" as const };
|
return { status: "unauthenticated" as const };
|
||||||
}
|
}
|
||||||
default: {
|
default: {
|
||||||
@@ -103,6 +118,8 @@ export function AuthProvider({ children }: { children: React.ReactNode }) {
|
|||||||
update,
|
update,
|
||||||
signIn,
|
signIn,
|
||||||
signOut,
|
signOut,
|
||||||
|
// for optimistic cases when we assume "loading" doesn't immediately invalidate the user
|
||||||
|
lastUserId: lastUserId.current,
|
||||||
}
|
}
|
||||||
: noopAuthContext;
|
: noopAuthContext;
|
||||||
|
|
||||||
|
|||||||
@@ -22,6 +22,32 @@ import { sequenceThrows } from "./errorUtils";
|
|||||||
import { featureEnabled } from "./features";
|
import { featureEnabled } from "./features";
|
||||||
import { getNextEnvVar } from "./nextBuild";
|
import { getNextEnvVar } from "./nextBuild";
|
||||||
|
|
||||||
|
async function getUserId(accessToken: string): Promise<string | null> {
|
||||||
|
try {
|
||||||
|
const apiUrl = getNextEnvVar("SERVER_API_URL");
|
||||||
|
const response = await fetch(`${apiUrl}/v1/me`, {
|
||||||
|
headers: {
|
||||||
|
Authorization: `Bearer ${accessToken}`,
|
||||||
|
},
|
||||||
|
});
|
||||||
|
|
||||||
|
if (!response.ok) {
|
||||||
|
try {
|
||||||
|
console.error(await response.text());
|
||||||
|
} catch (e) {
|
||||||
|
console.error("Failed to parse error response", e);
|
||||||
|
}
|
||||||
|
return null;
|
||||||
|
}
|
||||||
|
|
||||||
|
const userInfo = await response.json();
|
||||||
|
return userInfo.sub || null;
|
||||||
|
} catch (error) {
|
||||||
|
console.error("Error fetching user ID from backend:", error);
|
||||||
|
return null;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
const TOKEN_CACHE_TTL = REFRESH_ACCESS_TOKEN_BEFORE;
|
const TOKEN_CACHE_TTL = REFRESH_ACCESS_TOKEN_BEFORE;
|
||||||
const getAuthentikClientId = () => getNextEnvVar("AUTHENTIK_CLIENT_ID");
|
const getAuthentikClientId = () => getNextEnvVar("AUTHENTIK_CLIENT_ID");
|
||||||
const getAuthentikClientSecret = () => getNextEnvVar("AUTHENTIK_CLIENT_SECRET");
|
const getAuthentikClientSecret = () => getNextEnvVar("AUTHENTIK_CLIENT_SECRET");
|
||||||
@@ -122,13 +148,16 @@ export const authOptions = (): AuthOptions =>
|
|||||||
},
|
},
|
||||||
async session({ session, token }) {
|
async session({ session, token }) {
|
||||||
const extendedToken = token as JWTWithAccessToken;
|
const extendedToken = token as JWTWithAccessToken;
|
||||||
|
console.log("extendedToken", extendedToken);
|
||||||
|
const userId = await getUserId(extendedToken.accessToken);
|
||||||
|
|
||||||
return {
|
return {
|
||||||
...session,
|
...session,
|
||||||
accessToken: extendedToken.accessToken,
|
accessToken: extendedToken.accessToken,
|
||||||
accessTokenExpires: extendedToken.accessTokenExpires,
|
accessTokenExpires: extendedToken.accessTokenExpires,
|
||||||
error: extendedToken.error,
|
error: extendedToken.error,
|
||||||
user: {
|
user: {
|
||||||
id: assertExists(extendedToken.sub),
|
id: assertExistsAndNonEmptyString(userId, "User ID required"),
|
||||||
name: extendedToken.name,
|
name: extendedToken.name,
|
||||||
email: extendedToken.email,
|
email: extendedToken.email,
|
||||||
},
|
},
|
||||||
|
|||||||
486
www/app/reflector-api.d.ts
vendored
486
www/app/reflector-api.d.ts
vendored
@@ -696,7 +696,7 @@ export interface paths {
|
|||||||
patch?: never;
|
patch?: never;
|
||||||
trace?: never;
|
trace?: never;
|
||||||
};
|
};
|
||||||
"/v1/webhook": {
|
"/v1/daily/webhook": {
|
||||||
parameters: {
|
parameters: {
|
||||||
query?: never;
|
query?: never;
|
||||||
header?: never;
|
header?: never;
|
||||||
@@ -708,6 +708,27 @@ export interface paths {
|
|||||||
/**
|
/**
|
||||||
* Webhook
|
* Webhook
|
||||||
* @description Handle Daily webhook events.
|
* @description Handle Daily webhook events.
|
||||||
|
*
|
||||||
|
* Example webhook payload:
|
||||||
|
* {
|
||||||
|
* "version": "1.0.0",
|
||||||
|
* "type": "recording.ready-to-download",
|
||||||
|
* "id": "rec-rtd-c3df927c-f738-4471-a2b7-066fa7e95a6b-1692124192",
|
||||||
|
* "payload": {
|
||||||
|
* "recording_id": "08fa0b24-9220-44c5-846c-3f116cf8e738",
|
||||||
|
* "room_name": "Xcm97xRZ08b2dePKb78g",
|
||||||
|
* "start_ts": 1692124183,
|
||||||
|
* "status": "finished",
|
||||||
|
* "max_participants": 1,
|
||||||
|
* "duration": 9,
|
||||||
|
* "share_token": "ntDCL5k98Ulq", #gitleaks:allow
|
||||||
|
* "s3_key": "api-test-1j8fizhzd30c/Xcm97xRZ08b2dePKb78g/1692124183028"
|
||||||
|
* },
|
||||||
|
* "event_ts": 1692124192
|
||||||
|
* }
|
||||||
|
*
|
||||||
|
* Daily.co circuit-breaker: After 3+ failed responses (4xx/5xx), webhook
|
||||||
|
* state→FAILED, stops sending events. Reset: scripts/recreate_daily_webhook.py
|
||||||
*/
|
*/
|
||||||
post: operations["v1_webhook"];
|
post: operations["v1_webhook"];
|
||||||
delete?: never;
|
delete?: never;
|
||||||
@@ -899,81 +920,11 @@ export interface components {
|
|||||||
target_language: string;
|
target_language: string;
|
||||||
source_kind?: components["schemas"]["SourceKind"] | null;
|
source_kind?: components["schemas"]["SourceKind"] | null;
|
||||||
};
|
};
|
||||||
/**
|
|
||||||
* DailyWebhookEvent
|
|
||||||
* @description Daily webhook event structure.
|
|
||||||
*/
|
|
||||||
DailyWebhookEvent: {
|
|
||||||
/** Type */
|
|
||||||
type: string;
|
|
||||||
/** Id */
|
|
||||||
id: string;
|
|
||||||
/** Ts */
|
|
||||||
ts: number;
|
|
||||||
/** Data */
|
|
||||||
data: {
|
|
||||||
[key: string]: unknown;
|
|
||||||
};
|
|
||||||
};
|
|
||||||
/** DeletionStatus */
|
/** DeletionStatus */
|
||||||
DeletionStatus: {
|
DeletionStatus: {
|
||||||
/** Status */
|
/** Status */
|
||||||
status: string;
|
status: string;
|
||||||
};
|
};
|
||||||
/** GetTranscript */
|
|
||||||
GetTranscript: {
|
|
||||||
/** Id */
|
|
||||||
id: string;
|
|
||||||
/** User Id */
|
|
||||||
user_id: string | null;
|
|
||||||
/** Name */
|
|
||||||
name: string;
|
|
||||||
/**
|
|
||||||
* Status
|
|
||||||
* @enum {string}
|
|
||||||
*/
|
|
||||||
status:
|
|
||||||
| "idle"
|
|
||||||
| "uploaded"
|
|
||||||
| "recording"
|
|
||||||
| "processing"
|
|
||||||
| "error"
|
|
||||||
| "ended";
|
|
||||||
/** Locked */
|
|
||||||
locked: boolean;
|
|
||||||
/** Duration */
|
|
||||||
duration: number;
|
|
||||||
/** Title */
|
|
||||||
title: string | null;
|
|
||||||
/** Short Summary */
|
|
||||||
short_summary: string | null;
|
|
||||||
/** Long Summary */
|
|
||||||
long_summary: string | null;
|
|
||||||
/** Created At */
|
|
||||||
created_at: string;
|
|
||||||
/**
|
|
||||||
* Share Mode
|
|
||||||
* @default private
|
|
||||||
*/
|
|
||||||
share_mode: string;
|
|
||||||
/** Source Language */
|
|
||||||
source_language: string | null;
|
|
||||||
/** Target Language */
|
|
||||||
target_language: string | null;
|
|
||||||
/** Reviewed */
|
|
||||||
reviewed: boolean;
|
|
||||||
/** Meeting Id */
|
|
||||||
meeting_id: string | null;
|
|
||||||
source_kind: components["schemas"]["SourceKind"];
|
|
||||||
/** Room Id */
|
|
||||||
room_id?: string | null;
|
|
||||||
/** Room Name */
|
|
||||||
room_name?: string | null;
|
|
||||||
/** Audio Deleted */
|
|
||||||
audio_deleted?: boolean | null;
|
|
||||||
/** Participants */
|
|
||||||
participants: components["schemas"]["TranscriptParticipant"][] | null;
|
|
||||||
};
|
|
||||||
/** GetTranscriptMinimal */
|
/** GetTranscriptMinimal */
|
||||||
GetTranscriptMinimal: {
|
GetTranscriptMinimal: {
|
||||||
/** Id */
|
/** Id */
|
||||||
@@ -1105,6 +1056,345 @@ export interface components {
|
|||||||
*/
|
*/
|
||||||
words_per_speaker: components["schemas"]["SpeakerWords"][];
|
words_per_speaker: components["schemas"]["SpeakerWords"][];
|
||||||
};
|
};
|
||||||
|
/**
|
||||||
|
* GetTranscriptWithJSON
|
||||||
|
* @description Transcript response as structured JSON segments.
|
||||||
|
*
|
||||||
|
* Format: Array of segment objects with speaker info, text, and timing.
|
||||||
|
* Example:
|
||||||
|
* [
|
||||||
|
* {
|
||||||
|
* "speaker": 0,
|
||||||
|
* "speaker_name": "John Smith",
|
||||||
|
* "text": "Hello everyone",
|
||||||
|
* "start": 0.0,
|
||||||
|
* "end": 5.0
|
||||||
|
* }
|
||||||
|
* ]
|
||||||
|
*/
|
||||||
|
GetTranscriptWithJSON: {
|
||||||
|
/** Id */
|
||||||
|
id: string;
|
||||||
|
/** User Id */
|
||||||
|
user_id: string | null;
|
||||||
|
/** Name */
|
||||||
|
name: string;
|
||||||
|
/**
|
||||||
|
* Status
|
||||||
|
* @enum {string}
|
||||||
|
*/
|
||||||
|
status:
|
||||||
|
| "idle"
|
||||||
|
| "uploaded"
|
||||||
|
| "recording"
|
||||||
|
| "processing"
|
||||||
|
| "error"
|
||||||
|
| "ended";
|
||||||
|
/** Locked */
|
||||||
|
locked: boolean;
|
||||||
|
/** Duration */
|
||||||
|
duration: number;
|
||||||
|
/** Title */
|
||||||
|
title: string | null;
|
||||||
|
/** Short Summary */
|
||||||
|
short_summary: string | null;
|
||||||
|
/** Long Summary */
|
||||||
|
long_summary: string | null;
|
||||||
|
/** Created At */
|
||||||
|
created_at: string;
|
||||||
|
/**
|
||||||
|
* Share Mode
|
||||||
|
* @default private
|
||||||
|
*/
|
||||||
|
share_mode: string;
|
||||||
|
/** Source Language */
|
||||||
|
source_language: string | null;
|
||||||
|
/** Target Language */
|
||||||
|
target_language: string | null;
|
||||||
|
/** Reviewed */
|
||||||
|
reviewed: boolean;
|
||||||
|
/** Meeting Id */
|
||||||
|
meeting_id: string | null;
|
||||||
|
source_kind: components["schemas"]["SourceKind"];
|
||||||
|
/** Room Id */
|
||||||
|
room_id?: string | null;
|
||||||
|
/** Room Name */
|
||||||
|
room_name?: string | null;
|
||||||
|
/** Audio Deleted */
|
||||||
|
audio_deleted?: boolean | null;
|
||||||
|
/** Participants */
|
||||||
|
participants: components["schemas"]["TranscriptParticipant"][] | null;
|
||||||
|
/**
|
||||||
|
* @description discriminator enum property added by openapi-typescript
|
||||||
|
* @enum {string}
|
||||||
|
*/
|
||||||
|
transcript_format: "json";
|
||||||
|
/** Transcript */
|
||||||
|
transcript: components["schemas"]["TranscriptSegment"][];
|
||||||
|
};
|
||||||
|
/** GetTranscriptWithParticipants */
|
||||||
|
GetTranscriptWithParticipants: {
|
||||||
|
/** Id */
|
||||||
|
id: string;
|
||||||
|
/** User Id */
|
||||||
|
user_id: string | null;
|
||||||
|
/** Name */
|
||||||
|
name: string;
|
||||||
|
/**
|
||||||
|
* Status
|
||||||
|
* @enum {string}
|
||||||
|
*/
|
||||||
|
status:
|
||||||
|
| "idle"
|
||||||
|
| "uploaded"
|
||||||
|
| "recording"
|
||||||
|
| "processing"
|
||||||
|
| "error"
|
||||||
|
| "ended";
|
||||||
|
/** Locked */
|
||||||
|
locked: boolean;
|
||||||
|
/** Duration */
|
||||||
|
duration: number;
|
||||||
|
/** Title */
|
||||||
|
title: string | null;
|
||||||
|
/** Short Summary */
|
||||||
|
short_summary: string | null;
|
||||||
|
/** Long Summary */
|
||||||
|
long_summary: string | null;
|
||||||
|
/** Created At */
|
||||||
|
created_at: string;
|
||||||
|
/**
|
||||||
|
* Share Mode
|
||||||
|
* @default private
|
||||||
|
*/
|
||||||
|
share_mode: string;
|
||||||
|
/** Source Language */
|
||||||
|
source_language: string | null;
|
||||||
|
/** Target Language */
|
||||||
|
target_language: string | null;
|
||||||
|
/** Reviewed */
|
||||||
|
reviewed: boolean;
|
||||||
|
/** Meeting Id */
|
||||||
|
meeting_id: string | null;
|
||||||
|
source_kind: components["schemas"]["SourceKind"];
|
||||||
|
/** Room Id */
|
||||||
|
room_id?: string | null;
|
||||||
|
/** Room Name */
|
||||||
|
room_name?: string | null;
|
||||||
|
/** Audio Deleted */
|
||||||
|
audio_deleted?: boolean | null;
|
||||||
|
/** Participants */
|
||||||
|
participants: components["schemas"]["TranscriptParticipant"][] | null;
|
||||||
|
};
|
||||||
|
/**
|
||||||
|
* GetTranscriptWithText
|
||||||
|
* @description Transcript response with plain text format.
|
||||||
|
*
|
||||||
|
* Format: Speaker names followed by their dialogue, one line per segment.
|
||||||
|
* Example:
|
||||||
|
* John Smith: Hello everyone
|
||||||
|
* Jane Doe: Hi there
|
||||||
|
*/
|
||||||
|
GetTranscriptWithText: {
|
||||||
|
/** Id */
|
||||||
|
id: string;
|
||||||
|
/** User Id */
|
||||||
|
user_id: string | null;
|
||||||
|
/** Name */
|
||||||
|
name: string;
|
||||||
|
/**
|
||||||
|
* Status
|
||||||
|
* @enum {string}
|
||||||
|
*/
|
||||||
|
status:
|
||||||
|
| "idle"
|
||||||
|
| "uploaded"
|
||||||
|
| "recording"
|
||||||
|
| "processing"
|
||||||
|
| "error"
|
||||||
|
| "ended";
|
||||||
|
/** Locked */
|
||||||
|
locked: boolean;
|
||||||
|
/** Duration */
|
||||||
|
duration: number;
|
||||||
|
/** Title */
|
||||||
|
title: string | null;
|
||||||
|
/** Short Summary */
|
||||||
|
short_summary: string | null;
|
||||||
|
/** Long Summary */
|
||||||
|
long_summary: string | null;
|
||||||
|
/** Created At */
|
||||||
|
created_at: string;
|
||||||
|
/**
|
||||||
|
* Share Mode
|
||||||
|
* @default private
|
||||||
|
*/
|
||||||
|
share_mode: string;
|
||||||
|
/** Source Language */
|
||||||
|
source_language: string | null;
|
||||||
|
/** Target Language */
|
||||||
|
target_language: string | null;
|
||||||
|
/** Reviewed */
|
||||||
|
reviewed: boolean;
|
||||||
|
/** Meeting Id */
|
||||||
|
meeting_id: string | null;
|
||||||
|
source_kind: components["schemas"]["SourceKind"];
|
||||||
|
/** Room Id */
|
||||||
|
room_id?: string | null;
|
||||||
|
/** Room Name */
|
||||||
|
room_name?: string | null;
|
||||||
|
/** Audio Deleted */
|
||||||
|
audio_deleted?: boolean | null;
|
||||||
|
/** Participants */
|
||||||
|
participants: components["schemas"]["TranscriptParticipant"][] | null;
|
||||||
|
/**
|
||||||
|
* @description discriminator enum property added by openapi-typescript
|
||||||
|
* @enum {string}
|
||||||
|
*/
|
||||||
|
transcript_format: "text";
|
||||||
|
/** Transcript */
|
||||||
|
transcript: string;
|
||||||
|
};
|
||||||
|
/**
|
||||||
|
* GetTranscriptWithTextTimestamped
|
||||||
|
* @description Transcript response with timestamped text format.
|
||||||
|
*
|
||||||
|
* Format: [MM:SS] timestamp prefix before each speaker and dialogue.
|
||||||
|
* Example:
|
||||||
|
* [00:00] John Smith: Hello everyone
|
||||||
|
* [00:05] Jane Doe: Hi there
|
||||||
|
*/
|
||||||
|
GetTranscriptWithTextTimestamped: {
|
||||||
|
/** Id */
|
||||||
|
id: string;
|
||||||
|
/** User Id */
|
||||||
|
user_id: string | null;
|
||||||
|
/** Name */
|
||||||
|
name: string;
|
||||||
|
/**
|
||||||
|
* Status
|
||||||
|
* @enum {string}
|
||||||
|
*/
|
||||||
|
status:
|
||||||
|
| "idle"
|
||||||
|
| "uploaded"
|
||||||
|
| "recording"
|
||||||
|
| "processing"
|
||||||
|
| "error"
|
||||||
|
| "ended";
|
||||||
|
/** Locked */
|
||||||
|
locked: boolean;
|
||||||
|
/** Duration */
|
||||||
|
duration: number;
|
||||||
|
/** Title */
|
||||||
|
title: string | null;
|
||||||
|
/** Short Summary */
|
||||||
|
short_summary: string | null;
|
||||||
|
/** Long Summary */
|
||||||
|
long_summary: string | null;
|
||||||
|
/** Created At */
|
||||||
|
created_at: string;
|
||||||
|
/**
|
||||||
|
* Share Mode
|
||||||
|
* @default private
|
||||||
|
*/
|
||||||
|
share_mode: string;
|
||||||
|
/** Source Language */
|
||||||
|
source_language: string | null;
|
||||||
|
/** Target Language */
|
||||||
|
target_language: string | null;
|
||||||
|
/** Reviewed */
|
||||||
|
reviewed: boolean;
|
||||||
|
/** Meeting Id */
|
||||||
|
meeting_id: string | null;
|
||||||
|
source_kind: components["schemas"]["SourceKind"];
|
||||||
|
/** Room Id */
|
||||||
|
room_id?: string | null;
|
||||||
|
/** Room Name */
|
||||||
|
room_name?: string | null;
|
||||||
|
/** Audio Deleted */
|
||||||
|
audio_deleted?: boolean | null;
|
||||||
|
/** Participants */
|
||||||
|
participants: components["schemas"]["TranscriptParticipant"][] | null;
|
||||||
|
/**
|
||||||
|
* @description discriminator enum property added by openapi-typescript
|
||||||
|
* @enum {string}
|
||||||
|
*/
|
||||||
|
transcript_format: "text-timestamped";
|
||||||
|
/** Transcript */
|
||||||
|
transcript: string;
|
||||||
|
};
|
||||||
|
/**
|
||||||
|
* GetTranscriptWithWebVTTNamed
|
||||||
|
* @description Transcript response in WebVTT subtitle format with participant names.
|
||||||
|
*
|
||||||
|
* Format: Standard WebVTT with voice tags using participant names.
|
||||||
|
* Example:
|
||||||
|
* WEBVTT
|
||||||
|
*
|
||||||
|
* 00:00:00.000 --> 00:00:05.000
|
||||||
|
* <v John Smith>Hello everyone
|
||||||
|
*/
|
||||||
|
GetTranscriptWithWebVTTNamed: {
|
||||||
|
/** Id */
|
||||||
|
id: string;
|
||||||
|
/** User Id */
|
||||||
|
user_id: string | null;
|
||||||
|
/** Name */
|
||||||
|
name: string;
|
||||||
|
/**
|
||||||
|
* Status
|
||||||
|
* @enum {string}
|
||||||
|
*/
|
||||||
|
status:
|
||||||
|
| "idle"
|
||||||
|
| "uploaded"
|
||||||
|
| "recording"
|
||||||
|
| "processing"
|
||||||
|
| "error"
|
||||||
|
| "ended";
|
||||||
|
/** Locked */
|
||||||
|
locked: boolean;
|
||||||
|
/** Duration */
|
||||||
|
duration: number;
|
||||||
|
/** Title */
|
||||||
|
title: string | null;
|
||||||
|
/** Short Summary */
|
||||||
|
short_summary: string | null;
|
||||||
|
/** Long Summary */
|
||||||
|
long_summary: string | null;
|
||||||
|
/** Created At */
|
||||||
|
created_at: string;
|
||||||
|
/**
|
||||||
|
* Share Mode
|
||||||
|
* @default private
|
||||||
|
*/
|
||||||
|
share_mode: string;
|
||||||
|
/** Source Language */
|
||||||
|
source_language: string | null;
|
||||||
|
/** Target Language */
|
||||||
|
target_language: string | null;
|
||||||
|
/** Reviewed */
|
||||||
|
reviewed: boolean;
|
||||||
|
/** Meeting Id */
|
||||||
|
meeting_id: string | null;
|
||||||
|
source_kind: components["schemas"]["SourceKind"];
|
||||||
|
/** Room Id */
|
||||||
|
room_id?: string | null;
|
||||||
|
/** Room Name */
|
||||||
|
room_name?: string | null;
|
||||||
|
/** Audio Deleted */
|
||||||
|
audio_deleted?: boolean | null;
|
||||||
|
/** Participants */
|
||||||
|
participants: components["schemas"]["TranscriptParticipant"][] | null;
|
||||||
|
/**
|
||||||
|
* @description discriminator enum property added by openapi-typescript
|
||||||
|
* @enum {string}
|
||||||
|
*/
|
||||||
|
transcript_format: "webvtt-named";
|
||||||
|
/** Transcript */
|
||||||
|
transcript: string;
|
||||||
|
};
|
||||||
/** HTTPValidationError */
|
/** HTTPValidationError */
|
||||||
HTTPValidationError: {
|
HTTPValidationError: {
|
||||||
/** Detail */
|
/** Detail */
|
||||||
@@ -1233,7 +1523,6 @@ export interface components {
|
|||||||
} | null;
|
} | null;
|
||||||
/**
|
/**
|
||||||
* Platform
|
* Platform
|
||||||
* @default whereby
|
|
||||||
* @enum {string}
|
* @enum {string}
|
||||||
*/
|
*/
|
||||||
platform: "whereby" | "daily";
|
platform: "whereby" | "daily";
|
||||||
@@ -1325,7 +1614,6 @@ export interface components {
|
|||||||
ics_last_etag?: string | null;
|
ics_last_etag?: string | null;
|
||||||
/**
|
/**
|
||||||
* Platform
|
* Platform
|
||||||
* @default whereby
|
|
||||||
* @enum {string}
|
* @enum {string}
|
||||||
*/
|
*/
|
||||||
platform: "whereby" | "daily";
|
platform: "whereby" | "daily";
|
||||||
@@ -1377,7 +1665,6 @@ export interface components {
|
|||||||
ics_last_etag?: string | null;
|
ics_last_etag?: string | null;
|
||||||
/**
|
/**
|
||||||
* Platform
|
* Platform
|
||||||
* @default whereby
|
|
||||||
* @enum {string}
|
* @enum {string}
|
||||||
*/
|
*/
|
||||||
platform: "whereby" | "daily";
|
platform: "whereby" | "daily";
|
||||||
@@ -1523,6 +1810,24 @@ export interface components {
|
|||||||
speaker: number | null;
|
speaker: number | null;
|
||||||
/** Name */
|
/** Name */
|
||||||
name: string;
|
name: string;
|
||||||
|
/** User Id */
|
||||||
|
user_id?: string | null;
|
||||||
|
};
|
||||||
|
/**
|
||||||
|
* TranscriptSegment
|
||||||
|
* @description A single transcript segment with speaker and timing information.
|
||||||
|
*/
|
||||||
|
TranscriptSegment: {
|
||||||
|
/** Speaker */
|
||||||
|
speaker: number;
|
||||||
|
/** Speaker Name */
|
||||||
|
speaker_name: string;
|
||||||
|
/** Text */
|
||||||
|
text: string;
|
||||||
|
/** Start */
|
||||||
|
start: number;
|
||||||
|
/** End */
|
||||||
|
end: number;
|
||||||
};
|
};
|
||||||
/** UpdateParticipant */
|
/** UpdateParticipant */
|
||||||
UpdateParticipant: {
|
UpdateParticipant: {
|
||||||
@@ -2311,7 +2616,7 @@ export interface operations {
|
|||||||
[name: string]: unknown;
|
[name: string]: unknown;
|
||||||
};
|
};
|
||||||
content: {
|
content: {
|
||||||
"application/json": components["schemas"]["GetTranscript"];
|
"application/json": components["schemas"]["GetTranscriptWithParticipants"];
|
||||||
};
|
};
|
||||||
};
|
};
|
||||||
/** @description Validation Error */
|
/** @description Validation Error */
|
||||||
@@ -2369,7 +2674,13 @@ export interface operations {
|
|||||||
};
|
};
|
||||||
v1_transcript_get: {
|
v1_transcript_get: {
|
||||||
parameters: {
|
parameters: {
|
||||||
query?: never;
|
query?: {
|
||||||
|
transcript_format?:
|
||||||
|
| "text"
|
||||||
|
| "text-timestamped"
|
||||||
|
| "webvtt-named"
|
||||||
|
| "json";
|
||||||
|
};
|
||||||
header?: never;
|
header?: never;
|
||||||
path: {
|
path: {
|
||||||
transcript_id: string;
|
transcript_id: string;
|
||||||
@@ -2384,7 +2695,11 @@ export interface operations {
|
|||||||
[name: string]: unknown;
|
[name: string]: unknown;
|
||||||
};
|
};
|
||||||
content: {
|
content: {
|
||||||
"application/json": components["schemas"]["GetTranscript"];
|
"application/json":
|
||||||
|
| components["schemas"]["GetTranscriptWithText"]
|
||||||
|
| components["schemas"]["GetTranscriptWithTextTimestamped"]
|
||||||
|
| components["schemas"]["GetTranscriptWithWebVTTNamed"]
|
||||||
|
| components["schemas"]["GetTranscriptWithJSON"];
|
||||||
};
|
};
|
||||||
};
|
};
|
||||||
/** @description Validation Error */
|
/** @description Validation Error */
|
||||||
@@ -2450,7 +2765,7 @@ export interface operations {
|
|||||||
[name: string]: unknown;
|
[name: string]: unknown;
|
||||||
};
|
};
|
||||||
content: {
|
content: {
|
||||||
"application/json": components["schemas"]["GetTranscript"];
|
"application/json": components["schemas"]["GetTranscriptWithParticipants"];
|
||||||
};
|
};
|
||||||
};
|
};
|
||||||
/** @description Validation Error */
|
/** @description Validation Error */
|
||||||
@@ -3256,11 +3571,7 @@ export interface operations {
|
|||||||
path?: never;
|
path?: never;
|
||||||
cookie?: never;
|
cookie?: never;
|
||||||
};
|
};
|
||||||
requestBody: {
|
requestBody?: never;
|
||||||
content: {
|
|
||||||
"application/json": components["schemas"]["DailyWebhookEvent"];
|
|
||||||
};
|
|
||||||
};
|
|
||||||
responses: {
|
responses: {
|
||||||
/** @description Successful Response */
|
/** @description Successful Response */
|
||||||
200: {
|
200: {
|
||||||
@@ -3271,15 +3582,6 @@ export interface operations {
|
|||||||
"application/json": unknown;
|
"application/json": unknown;
|
||||||
};
|
};
|
||||||
};
|
};
|
||||||
/** @description Validation Error */
|
|
||||||
422: {
|
|
||||||
headers: {
|
|
||||||
[name: string]: unknown;
|
|
||||||
};
|
|
||||||
content: {
|
|
||||||
"application/json": components["schemas"]["HTTPValidationError"];
|
|
||||||
};
|
|
||||||
};
|
|
||||||
};
|
};
|
||||||
};
|
};
|
||||||
}
|
}
|
||||||
|
|||||||
Reference in New Issue
Block a user