insightbuilder
diff --git a/‎movie_py_explored/auto_transcript_extract.py‎
Lines changed: 167 additions & 0 deletions b/‎movie_py_explored/auto_transcript_extract.py‎
Lines changed: 167 additions & 0 deletions
diff --git a/‎movie_py_explored/pjt1/Bebas-Regular.ttf‎
17 KB b/‎movie_py_explored/pjt1/Bebas-Regular.ttf‎
17 KB
diff --git a/‎movie_py_explored/pjt1/comp1.mp4‎
2.01 MB b/‎movie_py_explored/pjt1/comp1.mp4‎
2.01 MB
diff --git a/‎movie_py_explored/pjt1/explanation.wav‎
2.97 MB b/‎movie_py_explored/pjt1/explanation.wav‎
2.97 MB
diff --git a/‎movie_py_explored/pjt1/pjt1.py‎
Lines changed: 81 additions & 0 deletions b/‎movie_py_explored/pjt1/pjt1.py‎
Lines changed: 81 additions & 0 deletions
diff --git a/‎movie_py_explored/pjt1/pjt_bg.png‎
2.92 MB b/‎movie_py_explored/pjt1/pjt_bg.png‎
2.92 MB
diff --git a/‎movie_py_explored/pjt1/registration.mp4‎
3.33 MB b/‎movie_py_explored/pjt1/registration.mp4‎
3.33 MB
diff --git a/‎movie_py_explored/pjt1/simple_img_text.py‎
Lines changed: 15 additions & 0 deletions b/‎movie_py_explored/pjt1/simple_img_text.py‎
Lines changed: 15 additions & 0 deletions
diff --git a/‎movie_py_explored/pjt1/simple_vid.mp4‎
2.53 MB b/‎movie_py_explored/pjt1/simple_vid.mp4‎
2.53 MB
diff --git a/‎movie_py_explored/pjt1/simple_vid_text.py‎
Lines changed: 15 additions & 0 deletions b/‎movie_py_explored/pjt1/simple_vid_text.py‎
Lines changed: 15 additions & 0 deletions
@@ -0,0 +1,167 @@
+# /// script
+# requires-python = ">=3.13"
+# dependencies = [
+#     "moviepy",
+#     "faster_whisper",
+#     "pydub",
+#     "onnxruntime",
+#     "prompt_toolkit",
+#     "openai",
+#     "requests"
+# ]
+# ///
+
+from moviepy import VideoFileClip
+from faster_whisper import WhisperModel
+from prompt_toolkit import prompt
+from prompt_toolkit.completion import PathCompleter
+from pathlib import Path
+import openai
+
+import requests
+import os
+
+from pydantic import BaseModel
+from typing import List
+
+from uuid import uuid4
+
+
+# Structured-output schema passed as `response_format` in extract_kecs().
+class ScriptSegment(BaseModel):
+    # The scene text the keywords were derived for.
+    scene: str
+    # Visual search keywords for the scene (the prompt asks the model for 3).
+    kecs: List[str]
+
+
+# Structured-output schema passed as `response_format` in extract_segments().
+class Segment(BaseModel):
+    # Logical parts (scenes / topic sections) of the transcript, per the prompt.
+    logicalparts: List[str]
+
+
+# Pexels API credentials and endpoint used by search_and_download_pexels_videos().
+# NOTE(review): os.getenv returns None when PEXELS_API_KEY is unset, so HEADERS
+# would carry a None Authorization value — confirm the key is exported first.
+PEXELS_API_KEY = os.getenv("PEXELS_API_KEY")  # Set this in your environment
+PEXELS_SEARCH_URL = "https://api.pexels.com/videos/search"
+
+# Headers sent with each Pexels search request.
+HEADERS = {"Authorization": PEXELS_API_KEY}
+
+
+def search_and_download_pexels_videos(
+    kecs, output_dir="pexels_downloads", max_per_term=2
+):
+    """Search Pexels for each keyword and download the matching videos.
+
+    Args:
+        kecs: Iterable of search terms (visual keywords).
+        output_dir: Directory the videos are saved into; created if missing.
+        max_per_term: Number of results requested per search term.
+
+    Failures (network errors, non-200 responses, results without a
+    downloadable file) are reported on stdout and skipped, so one bad term
+    or video does not abort the remaining downloads.
+    """
+    os.makedirs(output_dir, exist_ok=True)
+
+    for term in kecs:
+        print(f"\n🔍 Searching Pexels for: {term}")
+        params = {"query": term, "per_page": max_per_term}
+        try:
+            # A timeout keeps a stalled connection from hanging the script.
+            response = requests.get(
+                PEXELS_SEARCH_URL, headers=HEADERS, params=params, timeout=30
+            )
+        except requests.RequestException as err:
+            print(f"❌ Error searching '{term}': {err}")
+            continue
+
+        if response.status_code != 200:
+            print(f"❌ Error searching '{term}': {response.text}")
+            continue
+
+        # Keep path separators and other special characters out of the
+        # filename; spaces still become underscores as before.
+        safe_term = "".join(
+            ch if ch.isalnum() or ch in "-_" else "_" for ch in term
+        )
+
+        for video in response.json().get("videos", []):
+            video_files = video.get("video_files") or []
+            if not video_files:
+                print(f"❌ No downloadable file for a '{term}' result, skipping")
+                continue
+
+            url = video_files[0]["link"]
+            # Take the extension from the URL path only; fall back to mp4
+            # when the link carries none.
+            ext = os.path.splitext(url.split("?")[0])[1].lstrip(".") or "mp4"
+            idx = str(uuid4())[:4]
+            filename = f"{safe_term}_{idx}.{ext}"
+            target = os.path.join(output_dir, filename)
+
+            print(f"⬇️ Downloading: {filename}")
+            try:
+                # Stream to disk instead of holding the whole video in memory,
+                # and refuse to save an HTTP error page as a video file.
+                with requests.get(url, stream=True, timeout=60) as vid_data:
+                    vid_data.raise_for_status()
+                    with open(target, "wb") as f:
+                        for chunk in vid_data.iter_content(chunk_size=1 << 20):
+                            f.write(chunk)
+            except (requests.RequestException, OSError) as err:
+                print(f"❌ Error downloading '{filename}': {err}")
+
+
+def select_mp4_file():
+    """Prompt for an .mp4 path (with tab completion) and validate it.
+
+    Returns:
+        The entered path when it ends in ".mp4" (case-insensitive) and
+        exists on disk; otherwise prints a message and returns None.
+    """
+    print("Enter path to .mp4 file (Tab to autocomplete):")
+    chosen = prompt("File: ", completer=PathCompleter(only_directories=False))
+
+    has_mp4_suffix = chosen.lower().endswith(".mp4")
+    if not (has_mp4_suffix and Path(chosen).exists()):
+        print("Invalid or non-existent file.")
+        return None
+
+    return chosen
+
+
+def extract_audio(mp4_path, audio_path="extracted_audio.wav"):
+    """Extract the audio track of a video into a 16-bit PCM WAV file.
+
+    Args:
+        mp4_path: Path of the source video.
+        audio_path: Destination WAV path.
+
+    Returns:
+        audio_path, for convenient chaining into transcribe().
+
+    Raises:
+        ValueError: If the video has no audio track.
+    """
+    # The context manager closes the clip and releases its reader
+    # even when writing the audio fails.
+    with VideoFileClip(mp4_path) as video:
+        if video.audio is None:
+            raise ValueError(f"No audio track found in: {mp4_path}")
+        video.audio.write_audiofile(audio_path, codec="pcm_s16le")  # saves as WAV
+    return audio_path
+
+
+def transcribe(audio_path, model_size="base"):
+    """Transcribe an audio file with faster-whisper.
+
+    Args:
+        audio_path: Path of the audio file to transcribe.
+        model_size: Whisper model size name passed to WhisperModel.
+
+    Returns:
+        The text of all segments, each stripped and joined by single spaces.
+    """
+    model = WhisperModel(
+        model_size, compute_type="int8"
+    )  # use "float16" if you have GPU
+    segments, _ = model.transcribe(audio_path)
+
+    # Join once instead of growing a string with += inside the loop.
+    return " ".join(segment.text.strip() for segment in segments).strip()
+
+
+def write_transcript(transcript, transcript_file="transcript.txt"):
+    """Write the transcript text to a file, replacing any existing content.
+
+    Args:
+        transcript: Text to save.
+        transcript_file: Destination path.
+    """
+    # Explicit UTF-8: transcripts may contain non-ASCII text, and the
+    # platform default encoding is not guaranteed to be able to encode it.
+    with open(transcript_file, "w", encoding="utf-8") as f:
+        f.write(transcript)
+
+
+def extract_segments(transcript: str):
+    """Ask the chat model to split a transcript into logical parts.
+
+    Sends the transcript with a fixed system prompt and requests output
+    parsed into the Segment schema.
+
+    Returns:
+        The `parsed` attribute of the first choice's message.
+    """
+    instructions = """
+You are a script analysis tool. Given a transcript, break it down into logical parts like scenes or topic sections of a script.
+return:
+- logicalparts: a list of parts from the given transcript.
+
+Only respond in the provided JSON schema. No explanation.
+"""
+
+    conversation = [
+        {"role": "system", "content": instructions},
+        {"role": "user", "content": transcript},
+    ]
+
+    completion = openai.OpenAI().beta.chat.completions.parse(
+        model="gpt-4o-mini-2024-07-18",
+        messages=conversation,
+        temperature=0.5,
+        response_format=Segment,
+    )
+
+    first_choice = completion.choices[0]
+    return first_choice.message.parsed
+
+
+def extract_kecs(scene: str):
+    """Ask the chat model for visual search keywords describing a scene.
+
+    Sends the scene with a fixed system prompt and requests output parsed
+    into the ScriptSegment schema.
+
+    Returns:
+        The `parsed` attribute of the first choice's message.
+    """
+    instructions = """
+You are a script analysis tool. Given a scene you have to provide the visual search keywords.
+return:
+- scene: the given scene 
+- kecs: a list of 3 visual search keywords (KECs) that best represent the scene. Don't include character names, or other PIIs.
+
+Only respond in the provided JSON schema. No explanation.
+"""
+
+    conversation = [
+        {"role": "system", "content": instructions},
+        {"role": "user", "content": f"The given scene is: {scene}"},
+    ]
+
+    completion = openai.OpenAI().beta.chat.completions.parse(
+        model="gpt-4o-mini-2024-07-18",
+        messages=conversation,
+        temperature=0.5,
+        response_format=ScriptSegment,
+    )
+
+    first_choice = completion.choices[0]
+    return first_choice.message.parsed
+
+
+# Script entry point: pick a video, extract its audio, transcribe it,
+# then print the transcript and save it to the default transcript file.
+if __name__ == "__main__":
+    mp4_path = select_mp4_file()
+    if not mp4_path:
+        # select_mp4_file() already printed the reason. Exit with a non-zero
+        # status so callers can tell nothing was transcribed; SystemExit is
+        # used because the bare exit() helper is only provided by `site`.
+        raise SystemExit(1)
+
+    print(f"Selected: {mp4_path}")
+    audio_path = extract_audio(mp4_path)
+
+    print("Transcribing...")
+    transcript = transcribe(audio_path)
+
+    print("\n--- Transcript ---\n")
+    print(transcript)
+    write_transcript(transcript)
@@ -0,0 +1,81 @@
+from moviepy import * # type: ignore
+import numpy as np
+
+# Start with a still background image shown for 110 seconds; the topic
+# text clips below end when this clip ends.
+
+bg_image = ImageClip("pjt_bg.png").with_duration(110)
+
+# bg_image.preview(fps=10)
+
+# One explanatory sentence per topic, in the same order as the topic titles.
+# NOTE(review): this list is not referenced anywhere else in the visible
+# script — presumably narration text; confirm whether it is still needed.
+topic_expl_list = [
+    "Studying in top U.S. institutions connects you with motivated, driven peers—your future collaborators, co-founders, and lifelong professional network.",
+    "Alumni from top universities often occupy leadership roles across industries, offering mentorship, referrals, and career opportunities for new graduates.",
+    "Graduates from U.S. institutions often land jobs with competitive starting packages, thanks to strong brand value and skill-based training.",
+    "The culture encourages excellence, critical thinking, and resilience—building the mindset that high performers and leaders thrive on.",
+    "Students get access to real-world, high-impact projects through research labs, industry tie-ups, and team-based coursework.",
+    "Top U.S. campuses are startup-friendly environments, with incubators, funding access, and mentors helping students turn ideas into companies.",
+    "Programs like OPT and STEM extensions offer a legal path to work in the U.S. post-graduation, with higher chances of H1B sponsorship.",
+    "Diverse campuses offer global perspectives, improving communication, empathy, and adaptability—skills essential in today’s world."
+]
+# Topic titles, one on-screen text line each.
+topics_list = [
+    "1) Network of high performance students",
+    "2) Strong Alumni of the college",
+    "3) Getting Higher starting salary",
+    "4) Mindset of high achiever",
+    "5) Working on high value project",
+    "6) Innovation Hubs and Startups",
+    "7) Higher Chances US Visa",
+    "8) Exposure to different cultures",
+]
+
+# Per-topic layout and timing, in the same order as topics_list:
+# vertical position in pixels and the second at which the line appears.
+topic_y_positions = [100, 250, 400, 550, 650, 750, 850, 950]
+topic_start_times = [5, 17, 29, 41, 53, 65, 77, 89]
+
+# Use method='label' (faster but single-line only):
+
+# Each line is placed at x=45, appears at its start time with a 1-second
+# cross-fade and stays visible until the background clip ends. Building the
+# clips from the tables above gives every clip, including the last one, the
+# fade-in exactly once.
+topic_clips = [
+    TextClip(
+        font="Bebas-Regular.ttf",
+        text=tp,
+        font_size=175,
+        color="white",
+        method="label",
+    )
+    .with_position((45, y_pos))
+    .with_start(start)
+    .with_end(bg_image.end)
+    .with_effects([vfx.CrossFadeIn(1)])
+    for tp, y_pos, start in zip(topics_list, topic_y_positions, topic_start_times)
+]
+
+# print("Topic 1 start:", topic_clips[7].start)
+
+# Layer the topic lines over the background, in list order.
+compo1 = CompositeVideoClip([bg_image, *topic_clips])
+
+# Load the narration at the reader's default sample rate; the previous
+# fps=10 was the video frame rate, not a usable audio sampling rate.
+# NOTE(review): "topics.wav" must exist next to this script — confirm the
+# intended file name.
+# The with_* methods return modified copies, so their results must be kept.
+topic_aud = AudioFileClip("topics.wav").with_start(0)
+
+# Attach the narration; without rebinding, the rendered video stays silent.
+compo1 = compo1.with_audio(topic_aud)
+
+compo1.write_videofile("comp1.mp4", fps=10)
@@ -0,0 +1,15 @@
+from moviepy import * # type: ignore
+ 
+def _make_label(text, color, position):
+    """Build a 5-second text clip with a slide-in effect at `position`."""
+    label = TextClip(font="Bebas-Regular.ttf", text=text, font_size=400, color=color)
+    label = label.with_duration(5)
+    label = label.with_effects([vfx.SlideIn(1, "left")])
+    # NOTE(review): the position is set after SlideIn; if SlideIn animates
+    # through the clip position, this call may override it — confirm the
+    # slide is actually visible in the output.
+    return label.with_position(position)
+
+
+# Three text lines composited over a still background image.
+txt = _make_label("Hello", "white", (45, 100))
+there = _make_label("There", "green", (745, 100))
+hru = _make_label("How are you", "green", (45, 500))
+
+bg = ImageClip("pjt_bg.png").with_duration(5)
+
+layers = [bg, txt, there, hru]
+video = CompositeVideoClip(layers)
+
+video.write_videofile("simple.mp4", fps=5)
@@ -0,0 +1,15 @@
+from moviepy import * # type: ignore
+ 
+# (text, color, top-left position) for each overlay line.
+overlay_specs = [
+    ("Hello", "white", (45, 20)),
+    ("There", "yellow", (345, 20)),
+    ("How are you", "red", (45, 150)),
+]
+
+# Each line lasts 5 seconds and fades in over the first second.
+txt, there, hru = [
+    TextClip(font="Bebas-Regular.ttf", text=words, font_size=140, color=shade)
+    .with_duration(5)
+    .with_effects([vfx.CrossFadeIn(1)])
+    .with_position(spot)
+    for words, shade, spot in overlay_specs
+]
+
+# The source video is the bottom layer of the composition.
+bg = VideoFileClip("registration.mp4")
+
+layers = [bg, txt, there, hru]
+video = CompositeVideoClip(layers)
+
+video.write_videofile("simple_vid.mp4", fps=30)