sync

Sleeping

App Files Files Community

sync / app.py

sheikhed

Update app.py

5ef29e5 verified 9 months ago

raw

history blame

6.13 kB

	import os
	import requests
	import json
	import time
	import subprocess
	import gradio as gr
	import uuid
	from dotenv import load_dotenv

	# Load environment variables
	load_dotenv()

	# API Keys
	B_KEY = os.getenv("B_KEY")

	# URLs
	API_URL = os.getenv("API_URL")
	UPLOAD_URL = os.getenv("UPLOAD_URL")

	def lipsync_api_call(video_url, audio_url):
	headers = {
	"Content-Type": "application/json",
	"x-api-key": B_KEY
	}

	data = {
	"audioUrl": audio_url,
	"videoUrl": video_url,
	"maxCredits": 1000,
	"model": "sync-1.6.0",
	"synergize": True,
	"pads": [0, 5, 0, 0],
	"synergizerStrength": 1
	}

	response = requests.post(API_URL, headers=headers, data=json.dumps(data))
	return response.json()

	def check_job_status(job_id):
	headers = {"x-api-key": B_KEY}
	max_attempts = 30 # Limit the number of attempts

	for _ in range(max_attempts):
	response = requests.get(f"{API_URL}/{job_id}", headers=headers)
	data = response.json()

	if data["status"] == "COMPLETED":
	return data["videoUrl"]
	elif data["status"] == "FAILED":
	return None

	time.sleep(10)
	return None

	def get_media_duration(file_path):
	# Fetch media duration using ffprobe
	cmd = ['ffprobe', '-v', 'error', '-show_entries', 'format=duration', '-of', 'default=noprint_wrappers=1:nokey=1', file_path]
	result = subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
	return float(result.stdout.strip())

	def combine_audio_video(video_path, audio_path, output_path):
	# Get durations of both video and audio
	video_duration = get_media_duration(video_path)
	audio_duration = get_media_duration(audio_path)

	if video_duration > audio_duration:
	# Trim video to match the audio length
	cmd = [
	'ffmpeg', '-i', video_path, '-i', audio_path,
	'-t', str(audio_duration), # Trim video to audio duration
	'-map', '0:v', '-map', '1:a',
	'-c:v', 'copy', '-c:a', 'aac',
	'-y', output_path
	]
	else:
	# Loop video if it's shorter than audio
	loop_count = int(audio_duration // video_duration) + 1 # Calculate how many times to loop
	cmd = [
	'ffmpeg', '-stream_loop', str(loop_count), '-i', video_path, '-i', audio_path,
	'-t', str(audio_duration), # Match the duration of the final video with the audio
	'-map', '0:v', '-map', '1:a',
	'-c:v', 'copy', '-c:a', 'aac',
	'-shortest', '-y', output_path
	]

	subprocess.run(cmd, check=True)

	def process_video(video_url, audio_url, progress=gr.Progress()):
	if not audio_url:
	return None, "No audio URL provided"
	if not video_url:
	return None, "No video URL provided"

	session_id = str(uuid.uuid4()) # Generate a unique session ID

	progress(0.2, desc="Processing video...")

	try:
	progress(0.4, desc="Initiating lipsync...")
	job_data = lipsync_api_call(video_url, audio_url)

	if "error" in job_data or "message" in job_data:
	raise Exception(job_data.get("error", job_data.get("message", "Unknown error")))

	job_id = job_data["id"]

	progress(0.5, desc="Processing lipsync...")
	result_url = check_job_status(job_id)

	if result_url:
	progress(0.9, desc="Downloading result...")
	response = requests.get(result_url)
	output_path = f"output_{session_id}.mp4"
	with open(output_path, "wb") as f:
	f.write(response.content)
	progress(1.0, desc="Complete!")
	return output_path, "Lipsync completed successfully!"
	else:
	raise Exception("Lipsync processing failed or timed out")

	except Exception as e:
	progress(0.8, desc="Falling back to simple combination...")
	try:
	# Download the video from the URL
	video_response = requests.get(video_url)
	temp_video_path = f"temp_video_{session_id}.mp4"
	with open(temp_video_path, "wb") as f:
	f.write(video_response.content)

	# Download the audio from the URL
	audio_response = requests.get(audio_url)
	temp_audio_path = f"temp_audio_{session_id}.mp3"
	with open(temp_audio_path, "wb") as f:
	f.write(audio_response.content)

	output_path = f"output_{session_id}.mp4"
	combine_audio_video(temp_video_path, temp_audio_path, output_path)

	# Clean up temporary files
	os.remove(temp_video_path)
	os.remove(temp_audio_path)

	progress(1.0, desc="Complete!")
	return output_path, f"Used fallback method. Original error: {str(e)}"
	except Exception as fallback_error:
	return None, f"All methods failed. Error: {str(fallback_error)}"

	def create_interface():
	with gr.Blocks() as app:
	gr.Markdown("# Video Lip Sync")
	with gr.Row():
	with gr.Column():
	video_url_input = gr.Textbox(label="Video URL")
	audio_url_input = gr.Textbox(label="Audio URL")
	generate_btn = gr.Button("Generate Video")
	with gr.Column():
	video_output = gr.Video(label="Generated Video")
	status_output = gr.Textbox(label="Status", interactive=False)

	def on_generate(video_url, audio_url):
	if not audio_url:
	return None, "Please provide an audio URL."
	if not video_url:
	return None, "Please provide a video URL."
	return process_video(video_url, audio_url)

	generate_btn.click(
	fn=on_generate,
	inputs=[video_url_input, audio_url_input],
	outputs=[video_output, status_output]
	)

	return app

	if __name__ == "__main__":
	app = create_interface()
	app.launch()