Spaces:

metek7
/

instagram-short-summarizing

Runtime error

App Files Files Community

instagram-short-summarizing / app.py

metek7

Update app.py

3b421e3 verified 11 months ago

raw

history blame

2.7 kB

	import sys
	import subprocess
	import pkg_resources

	required_packages = {
	'torch': 'torch',
	'gradio': 'gradio',
	'transformers': 'transformers',
	'decord': 'decord',
	'numpy': 'numpy'
	}

	def install_packages(packages):
	for package in packages:
	subprocess.check_call([sys.executable, "-m", "pip", "install", package])

	def check_and_install_packages():
	installed_packages = {pkg.key for pkg in pkg_resources.working_set}
	missing_packages = [required_packages[pkg] for pkg in required_packages if pkg not in installed_packages]

	if missing_packages:
	print("Installing missing packages...")
	install_packages(missing_packages)
	print("Packages installed successfully.")
	else:
	print("All required packages are already installed.")

	# Check and install required packages
	check_and_install_packages()

	# Now import the required modules
	import gradio as gr
	import torch
	from transformers import AutoTokenizer, AutoModelForCausalLM
	from decord import VideoReader, cpu
	import numpy as np

	# Define a simple video processing function (placeholder for LLaVA-Video)
	def process_video(video_path, max_frames=64):
	vr = VideoReader(video_path, ctx=cpu(0))
	total_frames = len(vr)
	frame_indices = np.linspace(0, total_frames - 1, max_frames, dtype=int)
	frames = vr.get_batch(frame_indices).asnumpy()
	return frames

	# Define a simple text generation function (placeholder for actual model)
	def generate_response(video_frames, question):
	# This is a placeholder. In reality, you'd use the LLaVA-Video model here.
	return f"Analyzed {len(video_frames)} frames. Your question was: {question}"

	def analyze_instagram_short(video_file, question):
	if video_file is None:
	return "Please upload an Instagram short video."

	video_frames = process_video(video_file)
	response = generate_response(video_frames, question)
	return response

	# Create Gradio interface
	with gr.Blocks() as demo:
	gr.Markdown("# 🎥 Instagram Short Video Analyzer")
	gr.Markdown("Upload your Instagram short video and ask questions about its content!")

	with gr.Row():
	with gr.Column():
	video_input = gr.Video(label="Upload Instagram Short Video")
	question_input = gr.Textbox(label="Ask a question about the video", placeholder="What's happening in this Instagram short?")
	submit_button = gr.Button("Analyze Short Video")
	output = gr.Textbox(label="Analysis Result")

	submit_button.click(
	fn=analyze_instagram_short,
	inputs=[video_input, question_input],
	outputs=output
	)

	if __name__ == "__main__":
	demo.launch()