From d4725846fda2cd4d3bd76180bd9ef91d8986e6fd Mon Sep 17 00:00:00 2001
From: sakamoto <sakamoto@sakamoto.dev>
Date: Fri, 2 Aug 2024 09:35:00 -0500
Subject: [PATCH] =?UTF-8?q?=F0=9F=8E=89=20init?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 .gitignore       |   2 +
 README.md        |   0
 requirements.txt |   0
 vid2sheet.py     | 280 +++++++++++++++++++++++++++++++++++++++++++++++
 4 files changed, 282 insertions(+)
 create mode 100644 .gitignore
 create mode 100644 README.md
 create mode 100644 requirements.txt
 create mode 100644 vid2sheet.py

diff --git a/.gitignore b/.gitignore
new file mode 100644
index 0000000..790e1cf
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1,2 @@
+.venv/
+test/
diff --git a/README.md b/README.md
new file mode 100644
index 0000000..e69de29
diff --git a/requirements.txt b/requirements.txt
new file mode 100644
index 0000000..e69de29
diff --git a/vid2sheet.py b/vid2sheet.py
new file mode 100644
index 0000000..fbfb604
--- /dev/null
+++ b/vid2sheet.py
@@ -0,0 +1,280 @@
+import cv2
+import numpy as np
+import os
+import re
+import img2pdf
+import tempfile
+import yt_dlp
+import argparse
+
+from PIL import Image
+from tqdm import tqdm
+
+# test
+# https://www.youtube.com/watch?v=tyloC0e-Tqk
+# ./
+
+# this is so overengineered that the bloat takes up 1/4 of the line
+
+parser = argparse.ArgumentParser(
+    description="Converts Video static images based on significant frame changes to sheet music in a form of .pdf file.",
+    formatter_class=argparse.ArgumentDefaultsHelpFormatter,
+)
+
+parser.add_argument("source", type=str, help="source of the file or a YouTube link")
+parser.add_argument("destination", type=str, help="destination of the output file")
+
+parser.add_argument("-v", "--verbose", action="store_true", help="enable debug mode")
+
+args = parser.parse_args()
+
+src = args.source
+dest = args.destination
+verbose = args.verbose
+
+print(f"[INFO] The source file is: {src}")
+print(f"[INFO] The destination file is: {dest}")
+print("[INFO] Verbose enabled") if verbose is True else None
+
+
+class Vid2Sheet:
+    def __init__(self, src, dest, intro_start: int = 0):
+        self.src = src
+        self.dest = dest
+
+        self.temp_dir = tempfile.TemporaryDirectory()
+        self.output_dir = self.temp_dir.name
+        self.final = os.path.join(self.output_dir, "final")
+        self.vid_folder = os.path.join(self.output_dir, "vid")
+        self.video_title = None
+
+        os.makedirs(self.final, exist_ok=True)
+        os.makedirs(self.vid_folder, exist_ok=True)
+        os.makedirs(self.dest, exist_ok=True)
+
+        if self.installation():
+            print("[INFO] Finished downloading")
+            all_entries = os.listdir(self.vid_folder)
+            files = [
+                entry
+                for entry in all_entries
+                if os.path.isfile(os.path.join(self.vid_folder, entry))
+            ]
+            print(f"[INFO] Found a video {files}, in {self.vid_folder}")
+
+            if files:
+                self.cap = cv2.VideoCapture(os.path.join(self.vid_folder, files[0]))
+            else:
+                print("[ERR] No files found in the directory.")
+                exit()
+        else:
+            self.cap = cv2.VideoCapture(self.src)
+            # Extract the filename without extension as a default title
+            self.video_title = os.path.splitext(os.path.basename(self.src))[0]
+
+        if not self.cap.isOpened():
+            print("[ERR] Could not open video.")
+            exit()
+
+        self.frame_count = intro_start
+        self.extracted_count = 0
+        self.previous_frame = None
+
+        self.total_frames = int(self.cap.get(cv2.CAP_PROP_FRAME_COUNT))
+        (
+            print(f"[DEBUG] Total number of frames in the video: {self.total_frames}")
+            if verbose is True
+            else None
+        )
+        self.pbar_count = 0
+        self.pbar = tqdm(total=self.total_frames)
+
+    def installation(self):
+        youtube_pattern = re.compile(
+            r"(https?://)?(www\.)?"
+            r"(youtube\.com/watch\?v=|youtu\.be/)"
+            r"[a-zA-Z0-9_-]{11}",
+            re.IGNORECASE,
+        )
+        if re.match(youtube_pattern, self.src):
+            print("[INFO] Detected YouTube link")
+            ydl_opts = {
+                "outtmpl": f"{self.vid_folder}/%(title)s.%(ext)s",
+                "quiet": True,  # Suppress output
+                "progress_hooks": [self._hook],
+            }
+            print("[INFO] Attempting to start download...")
+            try:
+                with yt_dlp.YoutubeDL(ydl_opts) as ydl:
+                    ydl.download([self.src])
+                return True
+            except Exception as e:
+                print(f"[ERR] An error occurred: {e}")
+                return False
+
+    def _hook(self, d):
+        if d["status"] == "finished":
+            self.video_title = d.get("info_dict", {}).get("title", "unknown_title")
+
+    def analyze_frame(self, change_threshold=12500000):
+        while True:
+            ret, current_frame = self.cap.read()
+            if not ret:
+                break
+
+            self.gray_current = cv2.cvtColor(current_frame, cv2.COLOR_BGR2GRAY)
+
+            if self.previous_frame is None:
+                image_path = os.path.join(
+                    self.output_dir, f"image_{self.extracted_count:03}.jpg"
+                )
+                cv2.imwrite(image_path, current_frame)
+                self.extracted_count += 1
+                (
+                    self.pbar.set_description(
+                        f"[DEBUG] Start at Frame {self.frame_count}, saved as {image_path}"
+                    ) if verbose is True else self.pbar.set_description("[INFO] Analyzing video...")
+                )
+
+            else:
+                frame_diff = cv2.absdiff(self.previous_frame, self.gray_current)
+                diff_sum = np.sum(frame_diff)
+
+                if diff_sum > change_threshold:
+                    image_path = os.path.join(
+                        self.output_dir, f"image_{self.extracted_count:03}.jpg"
+                    )
+                    cv2.imwrite(image_path, current_frame)
+                    self.pbar.set_description(
+                        f"[DEBUG] Frame {self.frame_count} changed significantly, saved as {image_path}"
+                    ) if verbose is True else None
+                    self.extracted_count += 1
+
+            self.previous_frame = self.gray_current
+            self.frame_count += 1
+
+            self.pbar_count += 1
+            self.pbar.update()
+
+        self.cap.release()
+
+    def create_blank_image(self, width, height):
+        return Image.new("RGB", (width, height), "white")
+
+    def combine_imgs(self, image_1, image_2, dest, mode="vertical"):
+        if isinstance(image_1, str):
+            image_1 = Image.open(image_1)
+        if isinstance(image_2, str):
+            image_2 = Image.open(image_2)
+
+        width_1, height_1 = image_1.size
+        width_2, height_2 = image_2.size
+
+        if mode == "horizontal":
+            total_width = width_1 + width_2
+            max_height = max(height_1, height_2)
+            combined_image = Image.new("RGB", (total_width, max_height))
+            combined_image.paste(image_1, (0, 0))
+            combined_image.paste(image_2, (width_1, 0))
+
+        elif mode == "vertical":
+            max_width = max(width_1, width_2)
+            total_height = height_1 + height_2
+            combined_image = Image.new("RGB", (max_width, total_height))
+            combined_image.paste(image_1, (0, 0))
+            combined_image.paste(image_2, (0, height_1))
+
+        else:
+            raise ValueError("[ERR] Mode must be either 'vertical' or 'horizontal'.")
+
+        combined_image.save(dest)
+
+    def combine_in_pairs(self):
+        all_files = os.listdir(self.output_dir)
+        non_hidden_files = [f for f in all_files if not f.startswith(".")]
+        images = [
+            f
+            for f in non_hidden_files
+            if os.path.isfile(os.path.join(self.output_dir, f))
+        ]
+        images.sort(key=natural_keys)
+
+        if len(images) % 2 != 0:
+            last_image = images.pop()
+        else:
+            last_image = None
+
+        for img in range(0, len(images), 2):
+            image_1 = os.path.join(self.output_dir, images[img])
+            image_2 = os.path.join(self.output_dir, images[img + 1])
+            output_filename = f"combined_{img//2 + 1:03}.jpg"
+            output_path = os.path.join(self.final, output_filename)
+            self.combine_imgs(image_1, image_2, output_path, mode="vertical")
+
+        if last_image:
+            last_image_path = os.path.join(self.output_dir, last_image)
+            last_image_img = Image.open(last_image_path)
+            width, height = last_image_img.size
+            blank_image = self.create_blank_image(width, height)
+
+            blank_image_path = os.path.join(self.output_dir, "blank_image.jpg")
+            blank_image.save(blank_image_path)
+
+            output_filename = f"combined_{len(images)//2 + 1:03}.jpg"
+            output_path = os.path.join(self.final, output_filename)
+            self.combine_imgs(
+                last_image_path, blank_image_path, output_path, mode="vertical"
+            )
+
+            os.remove(blank_image_path)
+
+        self.pbar_count += 1
+        self.pbar.update()
+
+    def run(self):
+        self.analyze_frame()
+        self.combine_in_pairs()
+        self.convert_to_pdf()
+
+    def scan_folder(self, src):
+        files_in_folder = []
+
+        for root, dirs, files in os.walk(src):
+            for name in files:
+                if name.endswith((".png", ".jpg", ".jpeg", ".mp4", ".webm")):
+                    files_in_folder.append(os.path.join(root, name))
+
+        files_in_folder.sort(key=natural_keys)
+        return files_in_folder
+
+    def convert_to_pdf(self):
+        imgs = self.scan_folder(self.final)
+        if not imgs:
+            print("[ERR] No images found for PDF conversion.")
+            return
+
+        file_name = self.video_title if self.video_title else "output"
+        pdf_path = os.path.join(self.dest, f"{file_name}.pdf")
+
+        with open(pdf_path, "wb") as f:
+            f.write(img2pdf.convert(imgs))
+
+        self.pbar.set_description(f"[INFO] Saved file to {pdf_path}")
+        self.pbar_count += 1
+        self.pbar.update()
+
+    def __del__(self):
+        self.temp_dir.cleanup()
+
+
+def atoi(text):
+    return int(text) if text.isdigit() else text
+
+
+def natural_keys(text):
+    return [atoi(c) for c in re.split(r"(\d+)", text)]
+
+
+if __name__ == "__main__":
+    program = Vid2Sheet(src, dest)
+    program.run()