// Real-time background removal from a live webcam stream using
// Transformers.js (MODNet) on WebNN / WebGPU.
// Load Transformers.js from a pinned dev distribution (3.7.3 + ONNX Runtime 1.23.0-dev).
import * as transformers from "https://ibelem.github.io/transformersjs-dists/3.7.3_1.23.0-dev.20250906/transformers.js";
// Configure the ONNX Runtime WASM backend: run on the main thread (no proxy
// worker), enable SIMD, single-threaded, and fetch the .wasm binaries from
// the same pinned distribution as the library itself.
transformers.env.backends.onnx.wasm.proxy = false;
transformers.env.backends.onnx.wasm.simd = true;
transformers.env.backends.onnx.wasm.numThreads = 1;
transformers.env.backends.onnx.wasm.wasmPaths = "https://ibelem.github.io/transformersjs-dists/3.7.3_1.23.0-dev.20250906/";
// Cache every DOM element the demo touches.
const $ = (id) => document.getElementById(id);
const deviceLabel = $("device");
const status = $("status");
const container = $("container");
const canvas = $("canvas");
const outputCanvas = $("output-canvas");
const video = $("video");
const sizeSlider = $("size");
const sizeLabel = $("size-value");
const scaleSlider = $("scale");
const scaleLabel = $("scale-value");
/**
 * Resize the video element and both canvases to the same integer size.
 * @param {number} width  Target width in pixels (rounded to an integer).
 * @param {number} height Target height in pixels (rounded to an integer).
 */
function setStreamSize(width, height) {
  const w = Math.round(width);
  const h = Math.round(height);
  for (const element of [video, outputCanvas, canvas]) {
    element.width = w;
    element.height = h;
  }
}
// Initial status while the model is downloaded and compiled below.
status.textContent = "Loading model...";
/**
 * Resolve the raw `device`/`dtype` URL parameters into a pipeline config.
 *
 * @param {?string} deviceParam Raw `device` query parameter (may be null).
 * @param {?string} dtypeParam  Raw `dtype` query parameter (may be null).
 * @returns {{device: string, dtype: string, sessionOptions: object}}
 *   Lower-cased device name, validated dtype (falls back to 'fp16'), and
 *   ONNX Runtime session options; WebNN devices additionally get static
 *   input dimensions via freeDimensionOverrides.
 */
function getDeviceConfig(deviceParam, dtypeParam) {
  const WEBNN_DEVICES = ['webnn-gpu', 'webnn-cpu', 'webnn-npu'];
  const SUPPORTED_DTYPES = ['fp16', 'fp32', 'int8'];
  // WebNN compiles the graph ahead of time, so input dims must be pinned.
  const FREE_DIMENSION_HEIGHT = 256;
  const FREE_DIMENSION_WIDTH = 320;

  const device = (deviceParam || 'webnn-gpu').toLowerCase();

  let dtype = 'fp16';
  if (dtypeParam) {
    const candidate = dtypeParam.toLowerCase();
    if (SUPPORTED_DTYPES.includes(candidate)) {
      dtype = candidate;
    }
  }

  const sessionOptions = { logSeverityLevel: 0 };
  if (WEBNN_DEVICES.includes(device)) {
    sessionOptions.freeDimensionOverrides = {
      batch_size: 1,
      height: FREE_DIMENSION_HEIGHT,
      width: FREE_DIMENSION_WIDTH,
    };
  }

  return { device, dtype, sessionOptions };
}
// Resolve the execution device/dtype from the URL query string.
const urlParams = new URLSearchParams(window.location.search);
let { device, dtype, sessionOptions } = getDeviceConfig(urlParams.get('device'), urlParams.get('dtype'));

// BUGFIX: the original only reassigned `device` on fallback, leaving
// `sessionOptions` computed for the unsupported device — so the WebNN
// fallback ran without freeDimensionOverrides. Recompute the full config.
const SUPPORTED_DEVICES = ['webgpu', 'webnn-gpu', 'webnn-cpu', 'webnn-npu'];
if (!SUPPORTED_DEVICES.includes(device)) {
  status.textContent = `Unsupported device ${device}. Falling back to WebNN GPU.`;
  ({ device, dtype, sessionOptions } = getDeviceConfig('webnn-gpu', urlParams.get('dtype')));
}

// Human-readable label for the active backend.
const DEVICE_LABELS = {
  'webgpu': 'WebGPU',
  'webnn-gpu': 'WebNN GPU',
  'webnn-cpu': 'WebNN CPU',
  'webnn-npu': 'WebNN NPU',
};
deviceLabel.textContent = DEVICE_LABELS[device] ?? 'WebNN GPU';
// Instantiate the background-removal pipeline with the resolved config.
const model_id = "Xenova/modnet";
let pipe;
try {
  const pipelineOptions = {
    device,
    dtype,
    session_options: sessionOptions,
  };
  pipe = await transformers.pipeline("background-removal", model_id, pipelineOptions);
} catch (err) {
  // Surface the failure both inline and as a dialog, then abort the script.
  status.textContent = err.message;
  alert(err.message);
  throw err;
}
// --- Model input size control ---
let size = 256;
pipe.processor.feature_extractor.size = { shortest_edge: size };
sizeSlider.addEventListener("input", () => {
  size = Number(sizeSlider.value);
  pipe.processor.feature_extractor.size = { shortest_edge: size };
  sizeLabel.textContent = size;
});
// WebNN sessions are compiled with fixed dimensions (freeDimensionOverrides),
// so resizing the model input is only allowed on non-WebNN devices.
sizeSlider.disabled = ['webnn-gpu', 'webnn-cpu', 'webnn-npu'].includes(device);
// --- Output scale control ---
let scale = 0.5;
scaleSlider.addEventListener("input", (event) => {
  scale = Number(event.target.value);
  setStreamSize(video.videoWidth * scale, video.videoHeight * scale);
  scaleLabel.textContent = scale;
});
scaleSlider.disabled = false;
// Everything is configured — tell the user we are ready to stream.
status.textContent = "Ready";
// Guard so only one inference runs at a time; frames arriving while busy are skipped.
let isProcessing = false;
// Timestamp of the previously completed frame, used for the FPS readout.
let previousTime;
// willReadFrequently hints the browser to keep these canvases CPU-readable.
const context = canvas.getContext("2d", { willReadFrequently: true });
const outputContext = outputCanvas.getContext("2d", {
  willReadFrequently: true,
});
// --- "Hold to show raw video" button ---
const showVideoBtn = document.getElementById("show-video-btn");
let videoToggleActive = false;

/**
 * Toggle between the raw <video> element and the processed output canvas.
 * @param {boolean} showVideo true to reveal the camera feed, false for output.
 */
function setVideoCanvasDisplay(showVideo) {
  if (showVideo) {
    video.style.display = "block";
    video.style.width = "100%";
    video.style.height = "100%";
    outputCanvas.style.display = "none";
  } else {
    video.style.display = "none";
    outputCanvas.style.display = "block";
  }
}

// While the button is held (and processing is live) show the raw feed;
// releasing the pointer — or dragging it off the button — restores the
// processed view.
const revealRawVideo = () => {
  if (isProcessing) {
    videoToggleActive = true;
    setVideoCanvasDisplay(true);
  }
};
const restoreOutputView = () => {
  if (videoToggleActive) {
    videoToggleActive = false;
    setVideoCanvasDisplay(false);
  }
};
showVideoBtn.addEventListener("pointerdown", revealRawVideo);
showVideoBtn.addEventListener("pointerup", restoreOutputView);
showVideoBtn.addEventListener("pointerleave", restoreOutputView);

// Start with the processed output visible.
setVideoCanvasDisplay(false);
/**
 * Per-frame loop: grab the current video frame, run the background-removal
 * pipeline on it, and paint the resulting alpha matte to the output canvas.
 * Frames that arrive while inference is still in flight are skipped; the
 * loop reschedules itself via requestAnimationFrame.
 */
function updateCanvas() {
  const { width, height } = canvas;
  if (!isProcessing) {
    isProcessing = true;
    (async function () {
      try {
        // Read the current frame from the video.
        context.drawImage(video, 0, 0, width, height);
        const currentFrame = context.getImageData(0, 0, width, height);
        const image = new transformers.RawImage(currentFrame.data, width, height, 4);
        // Predict the alpha matte.
        const [output] = await pipe(image);
        // Draw the alpha matte on the output canvas.
        outputContext.putImageData(
          new ImageData(output.data, output.width, output.height),
          0,
          0,
        );
        if (previousTime !== undefined) {
          const fps = 1000 / (performance.now() - previousTime);
          status.textContent = `FPS: ${fps.toFixed(2)}`;
        }
        previousTime = performance.now();
      } catch (err) {
        // Report inference failures instead of leaving an unhandled rejection.
        console.error(err);
        status.textContent = `Error: ${err.message}`;
      } finally {
        // BUGFIX: always clear the flag — the original left isProcessing
        // stuck at true if inference threw, freezing the loop forever.
        isProcessing = false;
      }
    })();
  }
  window.requestAnimationFrame(updateCanvas);
}
// Request the webcam stream and kick off the processing loop.
navigator.mediaDevices
  .getUserMedia({ video: true })
  .then((stream) => {
    // Wire the stream into the (hidden) <video> element.
    video.srcObject = stream;
    // BUGFIX: play() returns a promise; report a rejection (e.g. autoplay
    // policy) instead of leaving it floating as an unhandled rejection.
    video.play().catch((err) => {
      status.textContent = err.message;
    });
    // Size everything from the camera's native resolution.
    const videoTrack = stream.getVideoTracks()[0];
    const { width, height } = videoTrack.getSettings();
    setStreamSize(width * scale, height * scale);
    // Fit the container to the stream's aspect ratio (within a 720x405 box).
    const ar = width / height;
    const [cw, ch] = ar > 720 / 405 ? [720, 720 / ar] : [405 * ar, 405];
    container.style.width = `${cw}px`;
    container.style.height = `${ch}px`;
    // Give the stream a moment to start before the first frame grab.
    setTimeout(updateCanvas, 50);
  })
  .catch((error) => {
    alert(error);
  });