-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathvideo_processor.py
More file actions
273 lines (222 loc) · 11.4 KB
/
video_processor.py
File metadata and controls
273 lines (222 loc) · 11.4 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
import subprocess
import os
import cv2
import sys
import multiprocessing
from concurrent.futures import ProcessPoolExecutor
class VideoProcessor:
    """Video-processing helpers built on the ffmpeg CLI and OpenCV.

    The ``ffmpeg`` executable must be reachable on PATH; construction
    fails fast with RuntimeError when it is not.
    """

    def __init__(self, num_processes=None):
        """Initialize the processor and verify ffmpeg availability.

        Args:
            num_processes (int | None): Number of worker processes used
                for parallel frame extraction. When None, one worker per
                logical CPU (``os.cpu_count()``) is used.

        Raises:
            RuntimeError: If ffmpeg is not installed or not on PATH.
        """
        self._validate_ffmpeg()
        if num_processes is None:
            # Default to one worker per logical CPU.
            self.num_processes = os.cpu_count()
        else:
            self.num_processes = num_processes
def _validate_ffmpeg(self):
"""Validate that ffmpeg is installed and accessible."""
try:
# Use shell=True for Windows command execution
subprocess.run('ffmpeg -version', check=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE, shell=True)
except (subprocess.SubprocessError, FileNotFoundError):
raise RuntimeError("ffmpeg is not installed or not accessible in PATH")
def downscale_video(self, input_path, output_path, width, height):
"""
Downscale the input video using ffmpeg while preserving aspect ratio.
Args:
input_path (str): Path to input video file
output_path (str): Path to save downscaled video
width (int): Target width
height (int): Target height
Returns:
str: Path to downscaled video
tuple: Actual dimensions (width, height) after preserving aspect ratio
"""
# Ensure input file exists
if not os.path.exists(input_path):
raise FileNotFoundError(f"Input video file not found: {input_path}")
# Get original video dimensions
cap = cv2.VideoCapture(input_path)
if not cap.isOpened():
raise RuntimeError(f"Could not open video file: {input_path}")
original_width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
original_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
cap.release()
# Calculate new dimensions that preserve aspect ratio
original_aspect = original_width / original_height
# If both width and height are specified, prioritize width for aspect ratio
new_width = width
new_height = int(new_width / original_aspect)
# If calculated height exceeds specified height, recalculate based on height
if new_height > height:
new_height = height
new_width = int(new_height * original_aspect)
# Ensure dimensions are divisible by 2 for ffmpeg compatibility
if new_width % 2 != 0:
new_width -= 1
if new_height % 2 != 0:
new_height -= 1
print(f"Original dimensions: {original_width}x{original_height}")
print(f"New dimensions (preserving aspect ratio, adjusted for ffmpeg): {new_width}x{new_height}")
# Create ffmpeg command for downscaling with Windows-safe quoting
cmd = (
f'ffmpeg -i "{input_path}" '
f'-vf "scale={new_width}:{new_height}" '
f'-c:v libx264 -crf 23 -preset fast -threads 0 -y "{output_path}"'
)
# Execute ffmpeg command
try:
# Use shell=True for Windows command execution
process = subprocess.run(cmd, check=True, stderr=subprocess.PIPE, shell=True)
except subprocess.CalledProcessError as e:
error_message = e.stderr.decode() if e.stderr else str(e)
raise RuntimeError(f"Error downscaling video: {error_message}")
return output_path, (new_width, new_height)
def extract_frames(self, video_path, batch_size=10):
"""
Extract frames from the video as numpy arrays using parallel processing.
Args:
video_path (str): Path to video file
batch_size (int): Number of frames to process in each batch
Returns:
list: List of frames as numpy arrays
float: FPS of the video
"""
if not os.path.exists(video_path):
raise FileNotFoundError(f"Video file not found: {video_path}")
cap = cv2.VideoCapture(video_path)
if not cap.isOpened():
raise RuntimeError(f"Could not open video file: {video_path}")
fps = cap.get(cv2.CAP_PROP_FPS)
total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
# For parallel processing, we need to know frame positions
frame_positions = []
for i in range(total_frames):
frame_positions.append(i)
frames = [None] * total_frames # Pre-allocate list to maintain frame order
# Define a worker function to extract a batch of frames
def extract_frame_batch(batch_positions, video_path):
batch_frames = []
cap = cv2.VideoCapture(video_path)
for pos in batch_positions:
cap.set(cv2.CAP_PROP_POS_FRAMES, pos)
ret, frame = cap.read()
if ret:
batch_frames.append((pos, frame))
else:
batch_frames.append((pos, None))
cap.release()
return batch_frames
# Process frames in parallel using batches
with ProcessPoolExecutor(max_workers=self.num_processes) as executor:
# Split frame positions into batches
batches = []
for i in range(0, len(frame_positions), batch_size):
batch = frame_positions[i:i+batch_size]
batches.append(batch)
# Submit batches for parallel processing
futures = []
for batch in batches:
future = executor.submit(extract_frame_batch, batch, video_path)
futures.append(future)
# Collect results while preserving order
from tqdm import tqdm
for future in tqdm(futures, desc="Extracting frame batches"):
try:
batch_results = future.result()
for pos, frame in batch_results:
if frame is not None:
frames[pos] = frame
except Exception as e:
print(f"Error extracting frames: {e}")
# Remove any None frames (in case some frames couldn't be read)
frames = [f for f in frames if f is not None]
return frames, fps
def create_comparison_video(self, input_path, ascii_path, output_path, scale_factor):
"""
Create a side-by-side comparison video showing the original video and its ASCII version.
Args:
input_path (str): Path to the original input video
ascii_path (str): Path to the ASCII converted video
output_path (str): Path to save the side-by-side comparison video
scale_factor (int): The scaling factor used for the ASCII video
Returns:
str: Path to the comparison video
"""
# Ensure input files exist
if not os.path.exists(input_path):
raise FileNotFoundError(f"Original video file not found: {input_path}")
if not os.path.exists(ascii_path):
raise FileNotFoundError(f"ASCII video file not found: {ascii_path}")
# Get original video dimensions
original_cap = cv2.VideoCapture(input_path)
if not original_cap.isOpened():
raise RuntimeError(f"Could not open video file: {input_path}")
original_width = int(original_cap.get(cv2.CAP_PROP_FRAME_WIDTH))
original_height = int(original_cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
original_cap.release()
# Get ASCII video dimensions (for logging/info purposes)
ascii_cap = cv2.VideoCapture(ascii_path)
if not ascii_cap.isOpened():
raise RuntimeError(f"Could not open video file: {ascii_path}")
ascii_width = int(ascii_cap.get(cv2.CAP_PROP_FRAME_WIDTH))
ascii_height = int(ascii_cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
ascii_cap.release()
print(f"Original video dimensions: {original_width}x{original_height}")
print(f"ASCII video dimensions: {ascii_width}x{ascii_height}")
# Calculate target dimensions for comparison based on original video and scale factor
target_height = original_height * scale_factor
original_aspect = original_width / original_height
target_width = int(target_height * original_aspect)
# Ensure target width is divisible by 2
if target_width % 2 != 0:
target_width -= 1
print(f"Target dimensions for comparison videos: {target_width}x{target_height}")
# Create the side-by-side comparison with ffmpeg
# We resize both videos to the calculated target dimensions before stacking them
# We maintain the audio from the original video
cmd = (
f'ffmpeg -i "{input_path}" -i "{ascii_path}" '
f'-filter_complex "'
f'[0:v]scale={target_width}:{target_height}[v0];'
f'[1:v]scale={target_width}:{target_height}[v1];'
f'[v0][v1]hstack=inputs=2[v]" '
f'-map "[v]" -map 0:a? -c:v libx264 -crf 23 -preset fast -threads 0 '
f'-c:a copy -y "{output_path}"'
)
try:
# Use shell=True for Windows command execution
process = subprocess.run(cmd, check=True, stderr=subprocess.PIPE, shell=True)
print(f"Comparison video created successfully: {output_path}")
except subprocess.CalledProcessError as e:
error_message = e.stderr.decode() if e.stderr else str(e)
raise RuntimeError(f"Error creating comparison video: {error_message}")
return output_path
def preprocess_to_bw(self, input_path, output_path):
"""
Preprocess the input video to black and white using a specific FFmpeg filter chain.
Args:
input_path (str): Path to input video file
output_path (str): Path to save the preprocessed video
Returns:
str: Path to the preprocessed video
"""
# Ensure input file exists
if not os.path.exists(input_path):
raise FileNotFoundError(f"Input video file not found: {input_path}")
# The specified FFmpeg filter chain
# The specified FFmpeg filter chain - corrected quoting for Windows shell
# The specified FFmpeg filter chain - corrected quoting for Windows shell
filter_chain = "extractplanes=y,eq=contrast=1.8:gamma=0.8,histeq,scale=640:-1:flags=lanczos,lut=if(lt(val\,120)\,0\,255)"
# Create ffmpeg command with the filter chain
cmd = (
f'ffmpeg -i "{input_path}" '
f'-vf "{filter_chain}" '
f'-c:v libx264 -crf 23 -preset fast -threads 0 -y "{output_path}"'
)
print(f"Applying preprocessing filter: {filter_chain}")
# Execute ffmpeg command
try:
# Use shell=True for Windows command execution
process = subprocess.run(cmd, check=True, stderr=subprocess.PIPE, shell=True)
print(f"Preprocessing complete. Output saved to: {output_path}")
except subprocess.CalledProcessError as e:
error_message = e.stderr.decode() if e.stderr else str(e)
raise RuntimeError(f"Error during preprocessing: {error_message}")
return output_path