import { create } from "zustand"
import { ClapProject } from "@/lib/clap/types"
import { newClap } from "@/lib/clap/newClap"
import { sleep } from "@/lib/utils/sleep"
// import { getSegmentationCanvas } from "@/lib/on-device-ai/getSegmentationCanvas"
import { LatentEngineStore } from "../core/types"
import { resolveSegments } from "../resolvers/resolveSegments"
import { fetchLatentClap } from "../core/fetchLatentClap"
import { dataUriToBlob } from "@/app/api/utils/dataUriToBlob"
import { parseClap } from "@/lib/clap/parseClap"
import { InteractiveSegmenterResult, MPMask } from "@mediapipe/tasks-vision"
import { segmentFrame } from "@/lib/on-device-ai/segmentFrameOnClick"
import { drawSegmentation } from "../core/drawSegmentation"
import { filterImage } from "@/lib/on-device-ai/filterImage"
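// Zustand store for the latent engine: it owns the current ClapProject, the
// playback state, the DOM elements used for display, and two loops: a slow,
// asynchronous "simulation" loop and a fast, synchronous rendering loop.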
export const useLatentEngine = create<LatentEngineStore>((set, get) => ({
width: 1024,
height: 576,
clap: newClap(),
debug: true,
streamType: "static",
isStatic: false,
isLive: false,
isInteractive: false,
isLoading: false, // true when a .clap is being downloaded and/or generated
isLoaded: false, // true if a clap is loaded
isPlaying: false,
isPaused: true,
// our "this is AI.. gasp!" disclaimer
hasDisclaimer: true,
hasPresentedDisclaimer: false,
simulationPromise: undefined,
simulationPending: false,
simulationStartedAt: performance.now(),
simulationEndedAt: performance.now(),
simulationDurationInMs: 0,
simulationVideoPlaybackFPS: 0,
simulationRenderingTimeFPS: 0,
renderingIntervalId: undefined,
renderingIntervalDelayInMs: 2000, // 2 sec
positionInMs: 0,
durationInMs: 0,
videoLayerElement: undefined,
imageElement: undefined,
videoElement: undefined,
segmentationElement: undefined,
videoLayer: undefined,
videoBuffer: "A",
  videoBufferA: undefined,
videoBufferB: undefined,
segmentationLayer: undefined,
interfaceLayer: undefined,
interfaceBuffer: "A",
interfaceBufferA: undefined,
interfaceBufferB: undefined,
setContainerDimension: ({ width, height }: { width: number; height: number }) => {
set({
width,
height
})
},
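  // generate a .clap from a text prompt (through fetchLatentClap), then open it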
imagine: async (prompt: string): Promise<void> => {
set({
isLoaded: false,
isLoading: true,
})
let clap: ClapProject | undefined = undefined
try {
clap = await fetchLatentClap(prompt)
} catch (err) {
      console.error(`imagine failed (${err})`)
set({
isLoading: false,
})
}
if (!clap) { return }
get().open(clap)
},
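  // parse a .clap from a URL, a ClapProject or a Blob, then derive the stream type flags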
open: async (src?: string | ClapProject | Blob) => {
const { debug } = get()
set({
isLoaded: false,
isLoading: true,
})
let clap: ClapProject | undefined = undefined
try {
clap = await parseClap(src, debug)
} catch (err) {
console.error(`failed to open the Clap: ${err}`)
set({
isLoading: false,
})
}
if (!clap) { return }
set({
clap,
isLoading: false,
isLoaded: true,
streamType: clap.meta.streamType,
isStatic: clap.meta.streamType !== "interactive" && clap.meta.streamType !== "live",
isLive: clap.meta.streamType === "live",
isInteractive: clap.meta.streamType === "interactive",
})
},
setVideoLayerElement: (videoLayerElement?: HTMLDivElement) => { set({ videoLayerElement }) },
setImageElement: (imageElement?: HTMLImageElement) => { set({ imageElement }) },
setVideoElement: (videoElement?: HTMLVideoElement) => { set({ videoElement }) },
setSegmentationElement: (segmentationElement?: HTMLCanvasElement) => { set({ segmentationElement }) },
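  // draw the segmentation mask returned by the on-device interactive segmenter
  // over the current frame, then release the mask memory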
  processClickOnSegment: (result: InteractiveSegmenterResult) => {
    const { imageElement, segmentationElement, debug } = get()
    if (debug) {
      console.log(`processClickOnSegment: user clicked on something:`, result)
    }
if (!result?.categoryMask) {
if (debug) {
console.log(`processClickOnSegment: no categoryMask, so we skip the click`)
}
return
}
try {
if (debug) {
        console.log(`processClickOnSegment: calling drawSegmentation`)
}
const canvasMask: HTMLCanvasElement = drawSegmentation({
mask: result.categoryMask,
canvas: segmentationElement,
backgroundImage: imageElement,
fillStyle: "rgba(255, 255, 255, 1.0)"
})
      // TODO: read the canvas to determine what the user clicked on
if (debug) {
console.log(`processClickOnSegment: filtering the original image`)
}
// filterImage(imageElement, canvasMask)
      if (debug) {
        console.log("processClickOnSegment: calling result.close() to free the mask memory")
      }
      result.close()
} catch (err) {
console.error(`processClickOnSegment: something failed ${err}`)
}
},
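  // translate a click on the segmentation layer into coordinates normalized
  // to the layer, then run the on-device segmenter on the current frame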
onClickOnSegmentationLayer: (event) => {
    const { videoElement, debug } = get()
if (debug) {
console.log("onClickOnSegmentationLayer")
}
    // TODO: use the videoElement only if this is a video!
    if (!videoElement) { return }
    // convert the click position into coordinates normalized to the layer
    const box = event.currentTarget.getBoundingClientRect()
    const px = event.clientX - box.left
    const py = event.clientY - box.top
    const x = px / box.width
    const y = py / box.height
    if (debug) {
      console.log(`onClickOnSegmentationLayer: user clicked on `, { x, y, px, py, box, videoElement })
    }
    const fn = async () => {
      const results: InteractiveSegmenterResult = await segmentFrame(videoElement, x, y)
      get().processClickOnSegment(results)
    }
    fn().catch((err) => console.error(`onClickOnSegmentationLayer: segmentation failed (${err})`))
},
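  // toggle playback: plays/pauses the underlying <video> element, reschedules
  // the rendering loop, and returns the new playing state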
togglePlayPause: (): boolean => {
const { isLoaded, isPlaying, renderingIntervalId, videoElement } = get()
if (!isLoaded) { return false }
const newValue = !isPlaying
    clearTimeout(renderingIntervalId)
if (newValue) {
      if (videoElement) {
        try {
          // play() returns a promise; failures (eg. autoplay policies) are reported asynchronously
          videoElement.play()?.catch((err) => {
            console.error(`togglePlayPause: failed to start the video (${err})`)
          })
        } catch (err) {
          console.error(`togglePlayPause: failed to start the video (${err})`)
        }
      }
set({
isPlaying: true,
renderingIntervalId: setTimeout(() => { get().runRenderingLoop() }, 0)
})
} else {
if (videoElement) {
try {
videoElement.pause()
} catch (err) {
console.error(`togglePlayPause: failed to pause the video (${err})`)
}
}
set({ isPlaying: false })
}
return newValue
},
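  // start playback and schedule the rendering loop (no-op if nothing is loaded)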
play: (): boolean => {
const { isLoaded, isPlaying, renderingIntervalId, renderingIntervalDelayInMs } = get()
if (!isLoaded) { return false }
if (isPlaying) { return true }
    clearTimeout(renderingIntervalId)
set({
isPlaying: true,
renderingIntervalId: setTimeout(() => { get().runRenderingLoop() }, 0)
})
return true
},
pause: (): boolean => {
const { isLoaded, renderingIntervalId } = get()
if (!isLoaded) { return false }
    clearTimeout(renderingIntervalId)
set({ isPlaying: false })
return false
},
  // a slow rendering function (async - it might call a third-party LLM)
runSimulationLoop: async () => {
const {
isLoaded,
isPlaying,
clap,
segmentationLayer,
imageElement,
videoElement,
height,
width,
} = get()
if (!isLoaded || !isPlaying) {
set({
simulationPending: false,
})
return
}
set({
simulationPending: true,
simulationStartedAt: performance.now(),
})
try {
/*
// console.log("doing stuff")
let timestamp = performance.now()
if (imageElement) {
// console.log("we have an image element:", imageElement)
const segmentationLayer = await getSegmentationCanvas({
frame: imageElement,
timestamp,
width,
height,
})
set({ segmentationLayer })
}
*/
// await sleep(500)
      // note: since we are asynchronous, we need to regularly check whether
      // the user asked to pause the system or not
if (get().isPlaying) {
// console.log(`runSimulationLoop: rendering video content layer..`)
// we only grab the first one
const videoLayer = (await resolveSegments(clap, "video", 1)).at(0)
if (get().isPlaying) {
set({
videoLayer
})
const { videoElement, imageElement, segmentationElement } = get()
if (videoElement) {
          // yes, it is a very dirty trick
          // yes, it will look bad
videoElement.defaultPlaybackRate = 0.5
}
const canvas = drawSegmentation({
// no mask means this will effectively clear the canvas
canvas: segmentationElement,
backgroundImage: imageElement,
})
// console.log(`runSimulationLoop: rendered video content layer`)
}
}
} catch (err) {
console.error(`runSimulationLoop failed to render video layer ${err}`)
}
try {
if (get().isPlaying) {
// console.log(`runSimulationLoop: rendering UI layer..`)
        // note: for now we only display one element, to avoid handling a list of HTML elements
const interfaceLayer = (await resolveSegments(clap, "interface", 1)).at(0)
if (get().isPlaying) {
set({
interfaceLayer
})
// console.log(`runSimulationLoop: rendered UI layer`)
}
}
} catch (err) {
console.error(`runSimulationLoop failed to render UI layer ${err}`)
}
const simulationEndedAt = performance.now()
const simulationDurationInMs = simulationEndedAt - get().simulationStartedAt
    const simulationDurationInSec = simulationDurationInMs / 1000
    // I've counted the frames manually, and we indeed have, in terms of pure video playback,
    // 10 fps divided by 2 (the 0.5 playback factor)
    const videoFPS = 10
    const videoDurationInSec = 1
    const videoPlaybackSpeed = 0.5
    // effective playback frame rate: 1s of source at 10 fps, slowed to 0.5x -> 5 fps
    const simulationVideoPlaybackFPS = videoDurationInSec * videoFPS * videoPlaybackSpeed
    // rendering throughput: frames of generated content per second of wall-clock time
    const simulationRenderingTimeFPS = (videoDurationInSec * videoFPS) / simulationDurationInSec
set({
simulationPending: false,
simulationEndedAt,
simulationDurationInMs,
simulationVideoPlaybackFPS,
simulationRenderingTimeFPS,
})
},
  // a fast, synchronous rendering function whose sole role is to filter the
  // component list and put into the buffer the one that should be displayed
runRenderingLoop: () => {
const {
isLoaded,
isPlaying,
renderingIntervalId,
renderingIntervalDelayInMs,
simulationPromise,
simulationPending,
runSimulationLoop,
imageElement,
videoElement,
} = get()
if (!isLoaded) { return }
if (!isPlaying) { return }
try {
// console.log(`runRenderingLoop: starting..`)
// TODO: some operations with
// console.log(`runRenderingLoop: ended`)
} catch (err) {
console.error(`runRenderingLoop failed ${err}`)
}
    clearTimeout(renderingIntervalId)
set({
isPlaying: true,
simulationPromise: simulationPending ? simulationPromise : runSimulationLoop(),
// TODO: use requestAnimationFrame somehow
// https://developers.google.com/mediapipe/solutions/vision/image_segmenter/web_js
renderingIntervalId: setTimeout(() => { get().runRenderingLoop() }, renderingIntervalDelayInMs)
})
},
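  // seeking helpers: for now they only update the stored position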
jumpTo: (positionInMs: number) => {
set({ positionInMs })
},
jumpToStart: () => {
set({ positionInMs: 0 })
},
}))
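
// A minimal usage sketch from a React component (a hypothetical example, not
// part of this store; the .clap URL below is a placeholder):
//
//   const { isLoaded, isPlaying, open, togglePlayPause } = useLatentEngine()
//
//   useEffect(() => { open("https://example.com/demo.clap") }, [])
//
//   <button disabled={!isLoaded} onClick={togglePlayPause}>
//     {isPlaying ? "Pause" : "Play"}
//   </button>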