# Media_Utilities / Video_combiner_updated-.py
# Uploaded by RO-Rtechs ("Upload 5 files", commit f4877bc, verified).
import os
import subprocess
import tempfile
import time
from concurrent.futures import ThreadPoolExecutor

import gradio as gr
import torch
from PIL import Image
from tqdm import tqdm
def get_device():
    """Return the CUDA torch device when CUDA is available, else the CPU device."""
    device_name = 'cuda' if torch.cuda.is_available() else 'cpu'
    return torch.device(device_name)
# Resolve the torch device once at import time and report it on stdout.
# NOTE(review): `device` is not referenced by any other code visible in this file.
device = get_device()
print(f"Using device: {device}")
def get_unique_filename(base_name, extension):
    """Return a path built from ``base_name`` that does not exist yet.

    The first candidate is ``base_name`` with ``extension`` appended (unless it
    already ends with it). If that path exists, ``_1``, ``_2``, ... is inserted
    *before* the extension until a free name is found.

    Args:
        base_name: File name or path, with or without the extension.
        extension: Extension including the leading dot (e.g. ``".mp4"``). When
            empty, the extension already present in ``base_name`` is used so
            that numbered variants keep a valid file type.

    Returns:
        A path for which ``os.path.exists`` was false at the time of the call.
    """
    if not extension:
        # Reuse base_name's own extension; otherwise "clip.mp4" would collide
        # into "clip.mp4_1", which has no recognisable file type.
        stem, extension = os.path.splitext(base_name)
    elif base_name.endswith(extension):
        stem = base_name[: -len(extension)]
    else:
        stem = base_name

    candidate = f"{stem}{extension}"
    counter = 1
    while os.path.exists(candidate):
        candidate = f"{stem}_{counter}{extension}"
        counter += 1
    return candidate
def get_temp_task_path(input_video_path, task_name):
    """Create (if needed) and return a per-task folder next to the input video.

    The folder is named ``<task_name>_<trimmed>``, where ``<trimmed>`` is the
    video's file name with its first four whitespace-separated words dropped
    and the remaining words joined by underscores. File names with four words
    or fewer are used unchanged. Each intermediate value is printed for
    debugging.
    """
    file_name = os.path.basename(input_video_path)
    print(f"Base name: {file_name}")  # Debug print

    tokens = file_name.split()
    # Only names with more than four words are shortened.
    trimmed_name = '_'.join(tokens[4:]) if len(tokens) > 4 else file_name
    print(f"Trimmed name: {trimmed_name}")  # Debug print

    folder_name = f"{task_name}_{trimmed_name}"
    print(f"Folder name: {folder_name}")  # Debug print

    parent_dir = os.path.dirname(input_video_path)
    print(f"Input directory: {parent_dir}")  # Debug print

    temp_task_path = os.path.join(parent_dir, folder_name)
    print(f"Temporary task path: {temp_task_path}")  # Debug print

    os.makedirs(temp_task_path, exist_ok=True)
    print(f"Directory created: {temp_task_path}")  # Debug print
    return temp_task_path
def combine_videos(video_files, task_name):
    """Concatenate videos with ffmpeg's concat demuxer (stream copy, no re-encode).

    Args:
        video_files: Paths of the clips, in the order they should be joined.
        task_name: Accepted for interface compatibility; not used here.

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` on failure.
        The result is written next to the first input file.
    """
    if not video_files:
        return "No video files selected.", None

    # The first video's directory doubles as the output directory.
    input_dir = os.path.dirname(video_files[0])
    # Check uniqueness in the directory that is actually written to; otherwise
    # ffmpeg may stop at an interactive "overwrite?" prompt.
    output_file = get_unique_filename(os.path.join(input_dir, "combined_video"), ".mp4")

    # A private temp file avoids clashing with other requests that would
    # otherwise all write the same "filelist.txt".
    with tempfile.NamedTemporaryFile(
        "w", suffix=".txt", delete=False, encoding="utf-8"
    ) as filelist:
        filelist_path = filelist.name
        for video in video_files:
            video_path = os.path.abspath(video).replace(os.sep, '/')
            # Inside a single-quoted concat entry a quote must be written as '\''.
            escaped_path = video_path.replace("'", "'\\''")
            filelist.write(f"file '{escaped_path}'\n")

    command = [
        "ffmpeg", "-f", "concat", "-safe", "0", "-i", filelist_path,
        "-c", "copy", output_file
    ]
    try:
        result = subprocess.run(command, text=True, capture_output=True)
    except OSError as exc:  # e.g. ffmpeg is not installed
        return f"Error combining videos: {exc}", None
    finally:
        os.remove(filelist_path)

    if result.returncode == 0:
        return f"Videos combined successfully into {output_file}", output_file
    return f"Error combining videos: {result.stderr}", None
def combine_audios(audio_files):
    """Concatenate audio files with ffmpeg's concat demuxer (stream copy).

    Args:
        audio_files: Paths of the audio files, in the order to join them.

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` on failure.
        The result is written to the current working directory.
    """
    if not audio_files:
        return "No audio files selected.", None

    output_file = get_unique_filename("combined_audio", ".mp3")

    # A private temp file avoids clashing with other requests that would
    # otherwise all write the same "filelist.txt".
    with tempfile.NamedTemporaryFile(
        "w", suffix=".txt", delete=False, encoding="utf-8"
    ) as filelist:
        filelist_path = filelist.name
        for audio in audio_files:
            # Built outside the f-string: a backslash inside an f-string
            # expression is a syntax error before Python 3.12.
            audio_path = os.path.abspath(audio).replace(os.sep, '/')
            # Inside a single-quoted concat entry a quote must be written as '\''.
            escaped_path = audio_path.replace("'", "'\\''")
            filelist.write(f"file '{escaped_path}'\n")

    command = [
        "ffmpeg", "-f", "concat", "-safe", "0", "-i", filelist_path,
        "-c", "copy", output_file
    ]
    try:
        result = subprocess.run(command, text=True, capture_output=True)
    except OSError as exc:  # e.g. ffmpeg is not installed
        return f"Error combining audios: {exc}", None
    finally:
        os.remove(filelist_path)

    if result.returncode == 0:
        return f"Audios combined successfully into {output_file}", output_file
    return f"Error combining audios: {result.stderr}", None
def combine_images(image_files):
    """Combine images into one output file by invoking the ``convert`` command.

    Args:
        image_files: Paths of the images, in the order passed to ``convert``.

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` when the
        command could not be started or exited with a non-zero status.
    """
    if not image_files:
        return "No image files selected.", None

    output_file = get_unique_filename("combined_image", ".mp4")
    # NOTE(review): presumably ImageMagick's `convert`; confirm it is the
    # binary found on PATH on the deployment host.
    command = ["convert", *image_files, output_file]

    # subprocess.run drains both pipes and exposes the exit status. The earlier
    # loop only read stderr (stdout could fill up and stall the child), showed
    # a progress bar unrelated to real progress, and always reported success.
    try:
        result = subprocess.run(command, capture_output=True, text=True)
    except OSError as exc:  # e.g. `convert` is not installed
        return f"Error combining images: {exc}", None

    if result.returncode != 0:
        return f"Error combining images: {result.stderr}", None
    return f"Images combined successfully into {output_file}", output_file
def split_video(input_file, chunk_size):
    """Split a video into ``chunk_size``-second segments without re-encoding.

    Segments are written next to ``input_file`` as
    ``<name>_chunk_000.mp4``, ``<name>_chunk_001.mp4``, ...

    Args:
        input_file: Path of the video to split.
        chunk_size: Target segment duration in seconds.

    Returns:
        Segment paths in playback order.

    Raises:
        subprocess.CalledProcessError: If ffmpeg exits with a non-zero status.
    """
    input_dir = os.path.dirname(input_file)
    base_name = os.path.splitext(os.path.basename(input_file))[0]
    chunk_prefix = f"{base_name}_chunk_"
    chunk_suffix = ".mp4"

    command = [
        "ffmpeg", "-i", input_file, "-c", "copy", "-map", "0", "-segment_time", str(chunk_size),
        "-f", "segment", os.path.join(input_dir, f"{base_name}_chunk_%03d.mp4")
    ]
    subprocess.run(command, check=True)

    # Collect only files matching the exact "<name>_chunk_<digits>.mp4" pattern
    # so unrelated files that merely contain "chunk" are not picked up.
    indexed_chunks = []
    for file_name in os.listdir(input_dir or "."):  # "" means the current directory
        if not (file_name.startswith(chunk_prefix) and file_name.endswith(chunk_suffix)):
            continue
        index_text = file_name[len(chunk_prefix):-len(chunk_suffix)]
        if index_text.isdigit():
            indexed_chunks.append((int(index_text), file_name))

    # os.listdir returns entries in arbitrary order; sort by segment number so
    # callers can concatenate the chunks back in playback order.
    indexed_chunks.sort()
    return [os.path.join(input_dir, file_name) for _, file_name in indexed_chunks]
def adjust_speed_chunked(media_file, speed, chunk_size=60):
    """Change playback speed by processing fixed-length chunks in parallel.

    The media is split into chunks, every chunk is re-timed with ffmpeg in a
    worker thread, and the re-timed chunks are concatenated next to the input.

    Args:
        media_file: Path of the media file to process.
        speed: Playback speed factor (``2.0`` plays twice as fast); must be > 0.
        chunk_size: Chunk duration in seconds used for splitting.

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` on failure.
    """
    if not media_file:
        return "No media file selected.", None
    if not speed or speed <= 0:
        # Guards the 1/speed division below.
        return "Speed must be greater than zero.", None

    try:
        chunk_files = split_video(media_file, chunk_size)
    except (subprocess.CalledProcessError, OSError) as exc:
        return f"Error splitting media: {exc}", None
    if not chunk_files:
        return "Error splitting media: no chunks were produced.", None
    # Concatenation order must follow playback order; sorting by (length, name)
    # orders the numbered chunk names numerically.
    chunk_files = sorted(chunk_files, key=lambda path: (len(path), path))

    # Probe the encoder once instead of once per chunk.
    codec = get_gpu_codec() or "libx264"
    output_files = [
        get_unique_filename(f"adjusted_speed_{os.path.basename(chunk)}", ".mp4")
        for chunk in chunk_files
    ]

    def process_chunk(chunk_file, output_file):
        command = [
            "ffmpeg", "-hwaccel", "auto", "-i", chunk_file, "-filter:v", f"setpts={1/speed}*PTS",
            "-filter:a", f"atempo={speed}", "-c:v", codec, "-preset", "fast", output_file
        ]
        subprocess.run(command, check=True)
        return output_file

    # Uniqueness is checked in the directory that is actually written to.
    combined_output_file = get_unique_filename(
        os.path.join(os.path.dirname(media_file), "adjusted_speed_combined"), ".mp4"
    )

    filelist_path = None
    try:
        with ThreadPoolExecutor() as executor:
            processed_files = list(executor.map(process_chunk, chunk_files, output_files))

        # Private temp list instead of a shared "filelist.txt". Paths are made
        # absolute because concat resolves relative entries against the list's
        # own directory.
        with tempfile.NamedTemporaryFile(
            "w", suffix=".txt", delete=False, encoding="utf-8"
        ) as filelist:
            filelist_path = filelist.name
            for processed_file in processed_files:
                entry = os.path.abspath(processed_file).replace(os.sep, "/")
                entry = entry.replace("'", "'\\''")
                filelist.write(f"file '{entry}'\n")

        command = [
            "ffmpeg", "-f", "concat", "-safe", "0", "-i", filelist_path,
            "-c", "copy", combined_output_file
        ]
        subprocess.run(command, check=True)
    except (subprocess.CalledProcessError, OSError) as exc:
        return f"Error adjusting speed: {exc}", None
    finally:
        # Remove only the intermediates this function created itself.
        for leftover in [*output_files, filelist_path]:
            if leftover and os.path.exists(leftover):
                os.remove(leftover)

    return f"Speed adjusted successfully to {speed}x in {combined_output_file}", combined_output_file
def _atempo_chain(speed):
    """Build a chain of ``atempo`` filters whose factors multiply to ``speed``.

    Each stage is kept within 0.5-2.0 so the chain works for any positive
    speed. For speeds already in that range the result is ``atempo=<speed>``.
    """
    factors = []
    remaining = speed
    while remaining > 2.0:
        factors.append(2.0)
        remaining /= 2.0
    while remaining < 0.5:
        factors.append(0.5)
        remaining /= 0.5
    factors.append(remaining)
    return ",".join(f"atempo={factor}" for factor in factors)


def adjust_speed(media_file, speed):
    """Re-encode a media file at a different playback speed with ffmpeg.

    Args:
        media_file: Path of the media file to process.
        speed: Playback speed factor (``2.0`` plays twice as fast); must be > 0.

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` when ffmpeg
        could not be started or exited with a non-zero status.
    """
    if not media_file:
        return "No media file selected.", None
    if not speed or speed <= 0:
        # Guards the 1/speed division below.
        return "Speed must be greater than zero.", None

    output_file = get_unique_filename(f"adjusted_speed_{os.path.basename(media_file)}", ".mp4")
    # Prefer a hardware encoder; fall back to a widely supported software codec.
    codec = get_gpu_codec() or "libx264"

    command = [
        "ffmpeg", "-hwaccel", "auto", "-i", media_file, "-filter:v", f"setpts={1/speed}*PTS",
        "-filter:a", _atempo_chain(speed), "-c:v", codec, "-preset", "fast", output_file
    ]

    # subprocess.run drains both pipes and exposes the exit status. The earlier
    # loop only read stderr (stdout could fill up and stall ffmpeg), showed a
    # progress bar unrelated to real progress, and always reported success.
    try:
        result = subprocess.run(command, capture_output=True, text=True)
    except OSError as exc:  # e.g. ffmpeg is not installed
        return f"Error adjusting speed: {exc}", None

    if result.returncode != 0:
        return f"Error adjusting speed: {result.stderr}", None
    return f"Speed adjusted successfully to {speed}x in {output_file}", output_file
def adjust_speed_by_length(media_file, desired_length_hhmmss):
    """Adjust playback speed so the media lasts the requested duration.

    Args:
        media_file: Path of the media file to process.
        desired_length_hhmmss: Target duration as an ``HH:MM:SS`` string.

    Returns:
        ``(message, output_path)`` as returned by ``adjust_speed``, or an error
        message with ``None`` when the target duration or the media length is
        unusable.
    """
    if not media_file:
        return "No media file selected.", None

    try:
        desired_length = hhmmss_to_seconds(desired_length_hhmmss)
    except ValueError as exc:
        return f"Invalid desired length '{desired_length_hhmmss}': {exc}", None
    if desired_length <= 0:
        # Guards the division below.
        return "Desired length must be greater than zero.", None

    try:
        original_length = get_media_length(media_file)
    except (ValueError, OSError) as exc:
        return f"Error reading media length: {exc}", None

    speed = original_length / desired_length
    return adjust_speed(media_file, speed)
def adjust_speed_combined(media_file, speed, hours, minutes, seconds, adjust_speed_checkbox, compress_checkbox):
    """Run speed adjustment and/or compression as selected in the UI.

    Args:
        media_file: Path of the media file to process.
        speed: Playback speed factor, used when no target length is given.
        hours, minutes, seconds: Target length; when any is non-zero the speed
            is derived from it instead of ``speed``. ``None`` counts as 0.
        adjust_speed_checkbox: Whether to adjust the speed.
        compress_checkbox: Whether to compress the (possibly re-timed) video.

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` on failure.
    """
    if not adjust_speed_checkbox and not compress_checkbox:
        return "Error: At least one of 'Adjust Speed' or 'Compress Video' must be checked.", None
    if not media_file:
        # Without this the compress-only path returned an empty message.
        return "No media file selected.", None

    output_file = media_file
    messages = []

    if adjust_speed_checkbox:
        # Cleared number fields arrive as None; treat them as zero.
        length_h, length_m, length_s = (int(value or 0) for value in (hours, minutes, seconds))
        if length_h or length_m or length_s:
            desired_length = f"{length_h:02}:{length_m:02}:{length_s:02}"
            speed_message, output_file = adjust_speed_by_length(media_file, desired_length)
        else:
            speed_message, output_file = adjust_speed_chunked(media_file, speed)
        messages.append(speed_message)

    # Compression is skipped when the speed step failed (output_file is None).
    if compress_checkbox and output_file:
        compressed_output_file = get_unique_filename(f"compressed_{os.path.basename(output_file)}", ".mp4")
        compress_message, output_file = compress_video(output_file, compressed_output_file)
        messages.append(compress_message)

    # Joining avoids a dangling " and " prefix when only compression ran.
    return " and ".join(messages), output_file
def hhmmss_to_seconds(hhmmss):
    """Convert an ``H:M:S`` string (three colon-separated integers) to seconds."""
    hours, minutes, secs = (int(field) for field in hhmmss.split(':'))
    return (hours * 60 + minutes) * 60 + secs
def get_media_length(media_file):
    """Return the duration of ``media_file`` in seconds, as reported by ffprobe.

    Raises:
        ValueError: If ffprobe does not print a parsable duration; the message
            includes whatever ffprobe wrote to stderr.
    """
    result = subprocess.run(
        ["ffprobe", "-v", "error", "-show_entries", "format=duration", "-of", "default=noprint_wrappers=1:nokey=1", media_file],
        capture_output=True,
        text=True,
    )
    # stderr is captured separately: merged into stdout, any diagnostic text
    # would end up in the value handed to float().
    duration_text = result.stdout.strip()
    try:
        return float(duration_text)
    except ValueError:
        detail = result.stderr.strip() or duration_text or "no duration reported"
        raise ValueError(f"Could not determine duration of {media_file!r}: {detail}") from None
def auto_color_correct(video_file):
    """Apply a fixed brightness/saturation boost to a video with ffmpeg's ``eq`` filter.

    The result is written next to the input as ``color_corrected_<name>``,
    keeping the input's extension (``.mp4`` if it has none).

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` on failure.
    """
    if not video_file:
        return "No video file selected.", None

    input_dir = os.path.dirname(video_file)
    stem, extension = os.path.splitext(os.path.basename(video_file))
    # Check uniqueness in the directory that is written to, and pass the real
    # extension so numbered variants keep a valid file type.
    output_file = get_unique_filename(
        os.path.join(input_dir, f"color_corrected_{stem}"), extension or ".mp4"
    )

    command = [
        "ffmpeg", "-i", video_file, "-vf", "eq=brightness=0.06:saturation=1.5", output_file
    ]
    try:
        subprocess.run(command, check=True)
    except (subprocess.CalledProcessError, OSError) as exc:
        return f"Error applying color correction: {exc}", None
    return f"Auto color correction applied successfully to {output_file}", output_file
def extract_audio(video_file):
    """Copy the audio stream of a video into a ``.mka`` file without re-encoding.

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` when no file
        was given or ffmpeg exits with a non-zero status.
    """
    if not video_file:
        return "No video file selected.", None

    source_name = os.path.basename(video_file)
    target = get_unique_filename(f"extracted_audio_{source_name}", ".mka")
    ffmpeg_args = ["ffmpeg", "-i", video_file, "-vn", "-acodec", "copy", target]

    try:
        subprocess.run(ffmpeg_args, check=True)
    except subprocess.CalledProcessError as e:
        return f"Error extracting audio: {e}. Command: {' '.join(ffmpeg_args)}", None
    else:
        return f"Audio extracted successfully into {target}", target
def compress_video(input_file, output_file):
    """Re-encode a video at a low, capped bitrate to reduce its size.

    Args:
        input_file: Path of the video to compress.
        output_file: Path the compressed video is written to.

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` on failure.
    """
    if not input_file:
        return "No video file selected.", None

    codec = get_gpu_codec()
    if not codec:
        print("No supported GPU codec found. Falling back to software encoding.")
        codec = "libx264"  # Fallback to a widely supported software codec

    # Adjust these parameters based on your specific needs
    bitrate = "1M"  # Lower bitrate for smaller file size
    maxrate = "1.2M"  # Max bitrate to limit peaks in bitrate
    bufsize = "2M"  # Buffer size for bitrate control
    preset = "fast"  # Faster preset for quicker compression

    command = [
        "ffmpeg", "-hwaccel", "auto", "-i", input_file,
        "-c:v", codec,
        "-preset", preset,
        "-b:v", bitrate,
        "-maxrate", maxrate,
        "-bufsize", bufsize,
    ]
    if "264" in codec:
        # "high" / 4.1 are H.264 profile and level names; the HEVC and MPEG-2
        # encoders that get_gpu_codec may return do not share them.
        command += ["-profile:v", "high", "-level", "4.1"]
    command.append(output_file)

    try:
        subprocess.run(command, check=True)
    except (subprocess.CalledProcessError, OSError) as e:
        return f"Error compressing video: {e}", None
    return f"Video compressed successfully into {output_file}", output_file
def add_watermark(video_file, watermark_type, watermark_text, watermark_image, opacity, position_x, position_y, font_size, font_color):
    """Burn a text or image watermark into a video with ffmpeg.

    Args:
        video_file: Path of the video to watermark.
        watermark_type: ``"text"`` or ``"image"``.
        watermark_text: Text to draw (text watermarks).
        watermark_image: Path of the overlay image (image watermarks).
        opacity: Watermark opacity, 0.0 (invisible) to 1.0 (opaque).
        position_x, position_y: Offset of the watermark from the top-left corner.
        font_size: Font size for text watermarks.
        font_color: Font colour for text watermarks (e.g. ``"#FFFFFF"``).

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` on failure.
    """
    if not video_file:
        return "No video file selected.", None
    if watermark_type == "text":
        if not watermark_text:
            return "No watermark text provided.", None
    elif watermark_type == "image":
        if not watermark_image:
            return "No watermark image selected.", None
    else:
        return f"Unsupported watermark type: {watermark_type}", None

    output_file = get_unique_filename(f"watermarked_{os.path.basename(video_file)}", ".mp4")

    text_path = None
    if watermark_type == "text":
        # Pass the text through a file with expansion disabled so quotes,
        # colons, percent signs etc. in the text cannot break the filter string.
        with tempfile.NamedTemporaryFile(
            "w", suffix=".txt", delete=False, encoding="utf-8"
        ) as text_file:
            text_file.write(watermark_text)
            text_path = text_file.name
        # Only the path needs escaping: forward slashes, and "\:" for the
        # drive-letter colon on Windows.
        filter_path = text_path.replace("\\", "/").replace(":", "\\:")
        drawtext = (
            f"drawtext=textfile='{filter_path}':expansion=none"
            f":x={position_x}:y={position_y}:fontsize={font_size}"
            f":fontcolor={font_color}@{opacity}"
        )
        command = ["ffmpeg", "-i", video_file, "-vf", drawtext, output_file]
    else:
        # The image must be a second input; overlay needs two video streams.
        # colorchannelmixer scales the image's alpha channel by `opacity`.
        overlay = (
            f"[1:v]format=rgba,colorchannelmixer=aa={opacity}[wm];"
            f"[0:v][wm]overlay={position_x}:{position_y}"
        )
        command = [
            "ffmpeg", "-i", video_file, "-i", watermark_image,
            "-filter_complex", overlay, output_file
        ]

    # subprocess.run drains both pipes and exposes the exit status; the earlier
    # stderr-only polling loop always reported success.
    try:
        result = subprocess.run(command, capture_output=True, text=True)
    except OSError as exc:  # e.g. ffmpeg is not installed
        return f"Error adding watermark: {exc}", None
    finally:
        if text_path and os.path.exists(text_path):
            os.remove(text_path)

    if result.returncode != 0:
        return f"Error adding watermark: {result.stderr}", None
    return f"Watermark added successfully to {output_file}", output_file
def compress_image(input_image):
    """Re-save an image as a JPEG (quality 95) in the current working directory.

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` when no image
        was given.
    """
    if not input_image:
        return "No image file selected.", None

    output_file = get_unique_filename(f"compressed_{os.path.basename(input_image)}", ".jpg")
    with Image.open(input_image) as img:
        # JPEG cannot store alpha or palette modes (RGBA, LA, P, ...); saving
        # them raises OSError, so convert to RGB first.
        jpeg_ready = img if img.mode in ("L", "RGB", "CMYK") else img.convert("RGB")
        jpeg_ready.save(output_file, "JPEG", quality=95)  # Adjust quality as needed
    return f"Image compressed successfully into {output_file}", output_file
def compress_image_lossless(input_image):
    """Re-save an image as an optimized PNG in the current working directory.

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` when no image
        was given.
    """
    if not input_image:
        return "No image file selected.", None

    source_name = os.path.basename(input_image)
    target = get_unique_filename(f"compressed_lossless_{source_name}", ".png")
    with Image.open(input_image) as picture:
        # PNG is lossless
        picture.save(target, "PNG", optimize=True)
    return f"Image compressed losslessly into {target}", target
def mp3_to_video(mp3_file, image_file):
    """Create an MP4 that shows a still image for the duration of an MP3.

    Args:
        mp3_file: Path of the audio file.
        image_file: Path of the image looped as the video track.

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` on failure.
    """
    if not mp3_file or not image_file:
        return "MP3 file or image file not selected.", None

    output_file = get_unique_filename(f"{os.path.splitext(os.path.basename(mp3_file))[0]}", ".mp4")
    command = [
        "ffmpeg", "-loop", "1", "-i", image_file, "-i", mp3_file,
        "-c:v", "libx264",
        # Round odd dimensions down to even and force 4:2:0 so libx264 accepts
        # the frame size and the output is not encoded as 4:4:4.
        "-vf", "scale=trunc(iw/2)*2:trunc(ih/2)*2", "-pix_fmt", "yuv420p",
        "-c:a", "aac", "-b:a", "192k", "-shortest", output_file
    ]
    try:
        subprocess.run(command, check=True)
    except (subprocess.CalledProcessError, OSError) as exc:
        return f"Error converting MP3 to video: {exc}", None
    return f"MP3 converted to video successfully into {output_file}", output_file
def video_to_mp3(video_file):
    """Extract a video's audio track to an MP3 (best VBR quality, ``-q:a 0``).

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` on failure.
    """
    if not video_file:
        return "No video file selected.", None

    output_file = get_unique_filename(f"{os.path.splitext(os.path.basename(video_file))[0]}", ".mp3")
    command = [
        "ffmpeg", "-i", video_file, "-q:a", "0", "-map", "a", output_file
    ]
    # Report failures as an error tuple, like the other converters in this
    # file, rather than letting the exception reach the UI.
    try:
        subprocess.run(command, check=True)
    except (subprocess.CalledProcessError, OSError) as exc:
        return f"Error converting video to MP3: {exc}", None
    return f"Video converted to MP3 successfully into {output_file}", output_file
def convert_image_format(input_image, output_format):
    """Save an image in another format, in the current working directory.

    Args:
        input_image: Path of the image to convert.
        output_format: Target format / file extension without the dot
            (e.g. ``"png"``, ``"jpg"``).

    Returns:
        ``(message, output_path)``; ``output_path`` is ``None`` when an
        argument is missing.
    """
    if not input_image:
        return "No image file selected.", None
    if not output_format:
        return "No output format selected.", None

    # Common extensions that differ from the format name PIL expects;
    # "JPG" or "TIF" passed to save() would fail.
    extension_to_format = {"JPG": "JPEG", "JPE": "JPEG", "TIF": "TIFF"}
    format_key = output_format.upper()
    pil_format = extension_to_format.get(format_key, format_key)

    output_file = get_unique_filename(f"{os.path.splitext(os.path.basename(input_image))[0]}", f".{output_format}")
    with Image.open(input_image) as img:
        converted = img
        if pil_format == "JPEG" and img.mode not in ("L", "RGB", "CMYK"):
            # JPEG cannot store alpha or palette modes.
            converted = img.convert("RGB")
        converted.save(output_file, pil_format)
    return f"Image converted to {output_format} format successfully into {output_file}", output_file
def get_gpu_codec():
    """Return the first Intel QSV encoder that the local ffmpeg build lists.

    Candidates are tried in the order ``h264_qsv``, ``hevc_qsv``,
    ``mpeg2_qsv``.

    Returns:
        The encoder name, or ``None`` when none is listed or ffmpeg cannot be
        run. A listed encoder is compiled into ffmpeg; this does not verify
        that matching hardware is present.
    """
    # Prioritize Intel QSV codecs for Intel GPUs
    codecs = ["h264_qsv", "hevc_qsv", "mpeg2_qsv"]

    try:
        result = subprocess.run(["ffmpeg", "-hide_banner", "-encoders"], capture_output=True, text=True)
    except OSError:  # ffmpeg is not installed or not executable
        print("No supported GPU codec found.")
        return None

    # Each encoder row is "<flags> <name> <description>"; compare against the
    # name column only so description text cannot produce a false match.
    available_encoders = set()
    for line in result.stdout.splitlines():
        fields = line.split()
        if len(fields) >= 2:
            available_encoders.add(fields[1])

    for codec in codecs:
        if codec in available_encoders:
            print(f"Using GPU codec: {codec}")  # Debug: confirm which codec is used
            return codec
    print("No supported GPU codec found.")
    return None
def interface():
    """Build the Gradio Blocks UI and return it without launching it.

    Each tab wires one of the processing functions in this file to a set of
    input components, a textbox for the status message and a file component
    for the result. Several local names (``video_file``, ``image_file``,
    ``convert_submit``, ...) are re-bound from tab to tab; every ``click``
    handler is registered before its names are reused.

    NOTE(review): the nesting of components inside each ``gr.Row`` was
    reconstructed from the statement order; confirm against the intended layout.
    """
    with gr.Blocks() as demo:
        gr.Markdown("### Media Combiner Tool")
        # --- Concatenate several videos ---
        with gr.Tab("Combine Videos"):
            with gr.Row():
                video_files = gr.File(label="Select Video Files", type="filepath", file_count="multiple")
                task_name = gr.Textbox(label="Task Name")
            video_submit = gr.Button("Combine Videos")
            video_output = gr.Textbox(label="Output")
            video_download = gr.File(label="Download Combined Video")
            video_submit.click(combine_videos, inputs=[video_files, task_name], outputs=[video_output, video_download])
        # --- Concatenate several audio files ---
        with gr.Tab("Combine Audios"):
            with gr.Row():
                audio_files = gr.File(label="Select Audio Files", type="filepath", file_count="multiple")
            audio_submit = gr.Button("Combine Audios")
            audio_output = gr.Textbox(label="Output")
            audio_download = gr.File(label="Download Combined Audio")
            audio_submit.click(combine_audios, inputs=[audio_files], outputs=[audio_output, audio_download])
        # --- Combine several images ---
        with gr.Tab("Combine Images"):
            with gr.Row():
                image_files = gr.File(label="Select Image Files", type="filepath", file_count="multiple")
            image_submit = gr.Button("Combine Images")
            image_output = gr.Textbox(label="Output")
            image_download = gr.File(label="Download Combined Image")
            image_submit.click(combine_images, inputs=[image_files], outputs=[image_output, image_download])
        # --- Speed change (by factor or by target length) and optional compression ---
        with gr.Tab("Adjust Speed"):
            with gr.Row():
                media_file = gr.File(label="Select Media File", type="filepath")
                speed = gr.Slider(label="Speed", minimum=0.5, maximum=2.0, step=0.1, value=1.0)
            with gr.Row():
                # A non-zero target length takes precedence over the slider
                # (see adjust_speed_combined).
                hours = gr.Number(label="Hours", value=0, precision=0)
                minutes = gr.Number(label="Minutes", value=0, precision=0)
                seconds = gr.Number(label="Seconds", value=0, precision=0)
            with gr.Row():
                adjust_speed_checkbox = gr.Checkbox(label="Adjust Speed", value=True)
                compress_checkbox = gr.Checkbox(label="Compress Video", value=False)
            speed_submit = gr.Button("Submit")
            speed_output = gr.Textbox(label="Output")
            speed_download = gr.File(label="Download Adjusted Media")
            speed_submit.click(adjust_speed_combined, inputs=[media_file, speed, hours, minutes, seconds, adjust_speed_checkbox, compress_checkbox], outputs=[speed_output, speed_download])
        # --- Fixed brightness/saturation adjustment ---
        with gr.Tab("Auto Color Correction"):
            with gr.Row():
                video_file = gr.File(label="Select Video File", type="filepath")
            color_submit = gr.Button("Apply Color Correction")
            color_output = gr.Textbox(label="Output")
            color_download = gr.File(label="Download Color Corrected Video")
            color_submit.click(auto_color_correct, inputs=[video_file], outputs=[color_output, color_download])
        # --- Copy the audio stream out of a video ---
        with gr.Tab("Extract Audio"):
            with gr.Row():
                video_file = gr.File(label="Select Video File", type="filepath")
            extract_submit = gr.Button("Extract Audio")
            extract_output = gr.Textbox(label="Output")
            extract_download = gr.File(label="Download Extracted Audio")
            extract_submit.click(extract_audio, inputs=[video_file], outputs=[extract_output, extract_download])
        # --- Text or image watermark ---
        with gr.Tab("Add Watermark"):
            with gr.Row():
                video_file = gr.File(label="Select Video File", type="filepath")
                watermark_type = gr.Radio(label="Watermark Type", choices=["text", "image"], value="text")
            with gr.Row():
                watermark_text = gr.Textbox(label="Watermark Text", visible=True)
                watermark_image = gr.File(label="Watermark Image", type="filepath", visible=False)
            with gr.Row():
                opacity = gr.Slider(label="Opacity", minimum=0.0, maximum=1.0, step=0.1, value=1.0)
                position_x = gr.Slider(label="Position X", minimum=0, maximum=1920, step=1, value=0)
                position_y = gr.Slider(label="Position Y", minimum=0, maximum=1080, step=1, value=0)
            with gr.Row():
                font_size = gr.Slider(label="Font Size", minimum=10, maximum=100, step=1, value=24, visible=True)
                font_color = gr.ColorPicker(label="Font Color", value="#FFFFFF", visible=True)
            watermark_submit = gr.Button("Add Watermark")
            watermark_output = gr.Textbox(label="Output")
            watermark_download = gr.File(label="Download Watermarked Video")
            # Show the text-related controls for "text" and the image picker
            # for "image"; the dict maps each component to its update.
            def update_visibility(watermark_type):
                return {
                    watermark_text: gr.update(visible=watermark_type == "text"),
                    watermark_image: gr.update(visible=watermark_type == "image"),
                    font_size: gr.update(visible=watermark_type == "text"),
                    font_color: gr.update(visible=watermark_type == "text")
                }
            watermark_type.change(update_visibility, inputs=[watermark_type], outputs=[watermark_text, watermark_image, font_size, font_color])
            watermark_submit.click(add_watermark, inputs=[video_file, watermark_type, watermark_text, watermark_image, opacity, position_x, position_y, font_size, font_color], outputs=[watermark_output, watermark_download])
        # --- Re-save an image as an optimized PNG ---
        with gr.Tab("Compress Image Losslessly"):
            with gr.Row():
                image_file = gr.File(label="Select Image File", type="filepath")
            compress_submit = gr.Button("Compress Image Losslessly")
            compress_output = gr.Textbox(label="Output")
            compress_download = gr.File(label="Download Compressed Image")
            compress_submit.click(compress_image_lossless, inputs=[image_file], outputs=[compress_output, compress_download])
        # --- Still image + MP3 -> MP4 ---
        with gr.Tab("Convert MP3 to Video"):
            with gr.Row():
                mp3_file = gr.File(label="Select MP3 File", type="filepath")
                image_file = gr.File(label="Select Image File", type="filepath")
            convert_submit = gr.Button("Convert MP3 to Video")
            convert_output = gr.Textbox(label="Output")
            convert_download = gr.File(label="Download Converted Video")
            convert_submit.click(mp3_to_video, inputs=[mp3_file, image_file], outputs=[convert_output, convert_download])
        # --- Video -> MP3 ---
        with gr.Tab("Convert Video to MP3"):
            with gr.Row():
                video_file = gr.File(label="Select Video File", type="filepath")
            convert_submit = gr.Button("Convert Video to MP3")
            convert_output = gr.Textbox(label="Output")
            convert_download = gr.File(label="Download Converted MP3")
            convert_submit.click(video_to_mp3, inputs=[video_file], outputs=[convert_output, convert_download])
    return demo
# Script entry point: build the UI and start the Gradio server.
if __name__ == "__main__":
    demo = interface()
    # NOTE(review): share=True presumably requests a public Gradio share link;
    # confirm that exposing these file-processing endpoints publicly is intended.
    demo.launch(share=True)