mirror of
https://github.com/Monadical-SAS/reflector.git
synced 2025-12-20 20:29:06 +00:00
add start end tags and stats
This commit is contained in:
@@ -47,4 +47,5 @@ scattertext
|
|||||||
pandas
|
pandas
|
||||||
jupyter
|
jupyter
|
||||||
seaborn
|
seaborn
|
||||||
matplotlib
|
matplotlib
|
||||||
|
termcolor
|
||||||
@@ -12,6 +12,9 @@ from viz_utilities import create_wordcloud, create_talk_diff_scatter_viz
|
|||||||
from text_utilities import summarize, post_process_transcription
|
from text_utilities import summarize, post_process_transcription
|
||||||
from loguru import logger
|
from loguru import logger
|
||||||
import nltk
|
import nltk
|
||||||
|
import time
|
||||||
|
from termcolor import colored
|
||||||
|
|
||||||
nltk.download('stopwords', quiet=True)
|
nltk.download('stopwords', quiet=True)
|
||||||
|
|
||||||
config = configparser.ConfigParser()
|
config = configparser.ConfigParser()
|
||||||
@@ -68,9 +71,11 @@ def main():
|
|||||||
try:
|
try:
|
||||||
while proceed:
|
while proceed:
|
||||||
frames = []
|
frames = []
|
||||||
|
start_time = time.time()
|
||||||
for i in range(0, int(RATE / FRAMES_PER_BUFFER * RECORD_SECONDS)):
|
for i in range(0, int(RATE / FRAMES_PER_BUFFER * RECORD_SECONDS)):
|
||||||
data = stream.read(FRAMES_PER_BUFFER, exception_on_overflow=False)
|
data = stream.read(FRAMES_PER_BUFFER, exception_on_overflow=False)
|
||||||
frames.append(data)
|
frames.append(data)
|
||||||
|
end_time = time.time()
|
||||||
|
|
||||||
wf = wave.open(TEMP_AUDIO_FILE, 'wb')
|
wf = wave.open(TEMP_AUDIO_FILE, 'wb')
|
||||||
wf.setnchannels(CHANNELS)
|
wf.setnchannels(CHANNELS)
|
||||||
@@ -80,8 +85,6 @@ def main():
|
|||||||
wf.close()
|
wf.close()
|
||||||
|
|
||||||
whisper_result = pipeline(TEMP_AUDIO_FILE, return_timestamps=True)
|
whisper_result = pipeline(TEMP_AUDIO_FILE, return_timestamps=True)
|
||||||
print(whisper_result['text'])
|
|
||||||
|
|
||||||
timestamp = whisper_result["chunks"][0]["timestamp"]
|
timestamp = whisper_result["chunks"][0]["timestamp"]
|
||||||
start = timestamp[0]
|
start = timestamp[0]
|
||||||
end = timestamp[1]
|
end = timestamp[1]
|
||||||
@@ -89,12 +92,18 @@ def main():
|
|||||||
end = start + 15.0
|
end = start + 15.0
|
||||||
duration = end - start
|
duration = end - start
|
||||||
item = {'timestamp': (last_transcribed_time, last_transcribed_time + duration),
|
item = {'timestamp': (last_transcribed_time, last_transcribed_time + duration),
|
||||||
'text': whisper_result['text']}
|
'text': whisper_result['text'],
|
||||||
|
'stats': (str(end_time - start_time), str(duration))
|
||||||
|
}
|
||||||
last_transcribed_time = last_transcribed_time + duration
|
last_transcribed_time = last_transcribed_time + duration
|
||||||
transcript_with_timestamp["chunks"].append(item)
|
transcript_with_timestamp["chunks"].append(item)
|
||||||
|
|
||||||
transcription += whisper_result['text']
|
transcription += whisper_result['text']
|
||||||
|
|
||||||
|
print(colored("<START>", "yellow"))
|
||||||
|
print(colored(whisper_result['text'], 'green'))
|
||||||
|
print(colored("<END> Recorded duration: " + str(end_time - start_time) + " | Transcribed duration: " +
|
||||||
|
str(duration), "yellow"))
|
||||||
|
|
||||||
except Exception as e:
|
except Exception as e:
|
||||||
print(e)
|
print(e)
|
||||||
finally:
|
finally:
|
||||||
|
|||||||
Reference in New Issue
Block a user