Skip to content

Commit 4b2e530

Browse files
committed
updated script for getting transcript
1 parent 21faa8c commit 4b2e530

2 files changed

Lines changed: 25 additions & 0 deletions

File tree

movie_py_explored/get_script.py

Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,25 @@
1+
from moviepy import VideoFileClip, TextClip, CompositeVideoClip
2+
from faster_whisper import WhisperModel
3+
4+
# Load the source video and dump its audio track to a WAV file for transcription.
# The context manager closes the clip (and its underlying readers) once the
# audio has been written, instead of leaving it open for the rest of the run.
with VideoFileClip("./sales_training_awareness_src.mp4") as video:
    if video.audio is None:
        # Fail with a clear message rather than an AttributeError on None.
        raise ValueError("source video has no audio track to transcribe")
    video.audio.write_audiofile("sales_training_awareness.wav")

# Transcribe with faster-whisper
model = WhisperModel("small")  # "small" model; switch to "medium" if needed
segments, _ = model.transcribe("sales_training_awareness.wav")

# Collect [text, start, duration] for every segment and mirror each entry to
# subtitle.srt.
# NOTE: the file holds one "text : start, duration" entry per line; despite the
# .srt extension this is not the standard SRT cue layout.
subtitle_clips = []
# Explicit UTF-8 so non-ASCII transcript text does not depend on the platform
# default encoding.
with open("subtitle.srt", "w", encoding="utf-8") as fsrt:
    for idx, segment in enumerate(segments):
        duration = segment.end - segment.start
        # Terminate each entry with a newline so entries do not run together.
        fsrt.write(f"{segment.text} : {segment.start}, {duration}\n")
        subtitle_clips.append([segment.text, segment.start, duration])
        # Progress log every fifth segment. The previous `break` here fired at
        # idx == 0 and stopped the loop after the first segment.
        if idx % 5 == 0:
            print(f"At idx: {idx}")

print("Writing Extracted Subtitle:")
print(subtitle_clips)

movie_py_explored/result.mp4

-7.37 MB
Binary file not shown.

0 commit comments

Comments
 (0)