Spaces:

blanchon
/

RobotHub-Frontend

Running

App Files Files Community

RobotHub-Frontend / src /lib /components /3d /elements /compute /modal /VideoInputConnectionModal.svelte

blanchon

Update

3cdf7b9 3 days ago

raw

history blame contribute delete

9.15 kB

	<script lang="ts">
	import * as Dialog from "@/components/ui/dialog";
	import { video } from "@robothub/transport-server-client";
	import type { video as videoTypes } from "@robothub/transport-server-client";
	import { Button } from "@/components/ui/button";
	import * as Card from "@/components/ui/card";
	import { Badge } from "@/components/ui/badge";
	import { toast } from "svelte-sonner";
	import { settings } from "$lib/runes/settings.svelte";
	import { videoManager } from "$lib/elements/video/VideoManager.svelte";
	import type { RemoteCompute } from "$lib/elements/compute//RemoteCompute.svelte";

	interface Props {
	workspaceId: string;
	open: boolean;
	compute: RemoteCompute;
	}

	let { open = $bindable(), compute, workspaceId }: Props = $props();

	let isConnecting = $state(false);
	let selectedCameraName = $state("front");
	let localStream: MediaStream \| null = $state(null);
	let videoProducer: any = null;

	// Auto-refresh rooms when modal opens
	$effect(() => {
	if (open) {
	videoManager.refreshRooms(workspaceId);
	}
	});

	async function handleConnectLocalCamera() {
	if (!compute.hasSession) {
	toast.error("No Inference Session available. Create a session first.");
	return;
	}

	isConnecting = true;
	try {
	// Get user media
	const stream = await navigator.mediaDevices.getUserMedia({
	video: true,
	audio: false
	});
	localStream = stream;

	// Get the camera room ID for the selected camera
	const cameraRoomId = compute.sessionData?.camera_room_ids[selectedCameraName];
	if (!cameraRoomId) {
	throw new Error(`No room found for camera: ${selectedCameraName}`);
	}

	// Create video producer and connect to the camera room
	videoProducer = new video.VideoProducer(settings.transportServerUrl);

	// Connect to the EXISTING camera room (don't create new one)
	const participantId = `frontend-camera-${selectedCameraName}-${Date.now()}`;
	const success = await videoProducer.connect(workspaceId, cameraRoomId, participantId);

	if (!success) {
	throw new Error("Failed to connect to camera room");
	}

	// Start streaming
	await videoProducer.startCamera();

	toast.success(`Camera connected to Inference Session`, {
	description: `Local camera streaming to ${selectedCameraName} input`
	});
	} catch (error) {
	console.error("Camera connection error:", error);
	toast.error("Failed to connect camera", {
	description: error instanceof Error ? error.message : "Unknown error"
	});
	} finally {
	isConnecting = false;
	}
	}

	async function handleDisconnectCamera() {
	try {
	if (videoProducer) {
	await videoProducer.stopStreaming();
	await videoProducer.disconnect();
	videoProducer = null;
	}

	if (localStream) {
	localStream.getTracks().forEach((track) => track.stop());
	localStream = null;
	}

	toast.success("Camera disconnected");
	} catch (error) {
	console.error("Disconnect error:", error);
	toast.error("Error disconnecting camera");
	}
	}

	// Cleanup on modal close
	$effect(() => {
	return () => {
	if (!open) {
	handleDisconnectCamera();
	}
	};
	});
	</script>

	<Dialog.Root bind:open>
	<Dialog.Content
	class="max-h-[80vh] max-w-xl overflow-y-auto border-slate-600 bg-slate-900 text-slate-100"
	>
	<Dialog.Header class="pb-3">
	<Dialog.Title class="flex items-center gap-2 text-lg font-bold text-slate-100">
	<span class="icon-[mdi--video-input-component] size-5 text-green-400"></span>
	Video Input - {compute.name \|\| "No Compute Selected"}
	</Dialog.Title>
	<Dialog.Description class="text-sm text-slate-400">
	Connect camera streams to provide visual input for AI inference
	</Dialog.Description>
	</Dialog.Header>

	<div class="space-y-4">
	<!-- Inference Session Status -->
	<div
	class="flex items-center justify-between rounded-lg border border-purple-500/30 bg-purple-900/20 p-3"
	>
	<div class="flex items-center gap-2">
	<span class="icon-[mdi--brain] size-4 text-purple-400"></span>
	<span class="text-sm font-medium text-purple-300">Inference Session</span>
	</div>
	{#if compute.hasSession}
	<Badge variant="default" class="bg-purple-600 text-xs">
	{compute.statusInfo.statusText}
	</Badge>
	{:else}
	<Badge variant="secondary" class="text-xs text-slate-400">No Session</Badge>
	{/if}
	</div>

	{#if !compute.hasSession}
	<Card.Root class="border-yellow-500/30 bg-yellow-500/5">
	<Card.Header>
	<Card.Title class="flex items-center gap-2 text-base text-yellow-200">
	<span class="icon-[mdi--alert] size-4"></span>
	Inference Session Required
	</Card.Title>
	</Card.Header>
	<Card.Content class="text-sm text-yellow-300">
	You need to create an Inference Session before connecting video inputs. The session
	defines which camera names are available for connection.
	</Card.Content>
	</Card.Root>
	{:else}
	<!-- Camera Selection and Connection -->
	<Card.Root class="border-green-500/30 bg-green-500/5">
	<Card.Header>
	<Card.Title class="flex items-center gap-2 text-base text-green-200">
	<span class="icon-[mdi--camera] size-4"></span>
	Camera Connection
	</Card.Title>
	</Card.Header>
	<Card.Content class="space-y-4">
	<!-- Available Cameras -->
	<div class="space-y-2">
	<div class="text-sm font-medium text-green-300">Available Camera Inputs:</div>
	<div class="grid grid-cols-2 gap-2">
	{#each compute.sessionConfig?.cameraNames \|\| [] as cameraName}
	<button
	onclick={() => (selectedCameraName = cameraName)}
	class="rounded border p-2 text-left {selectedCameraName === cameraName
	? 'border-green-500 bg-green-500/20'
	: 'border-slate-600 bg-slate-800/50 hover:bg-slate-700/50'}"
	>
	<div class="text-sm font-medium">{cameraName}</div>
	<div class="text-xs text-slate-400">
	Room: {compute.sessionData?.camera_room_ids[cameraName]?.slice(-8)}
	</div>
	</button>
	{/each}
	</div>
	</div>

	<!-- Connection Status -->
	<div class="rounded-lg border border-green-500/30 bg-green-900/20 p-3">
	<div class="flex items-center justify-between">
	<div>
	<p class="text-sm font-medium text-green-300">
	Selected Camera: {selectedCameraName}
	</p>
	<p class="text-xs text-green-400/70">
	{localStream ? "Connected" : "Not Connected"}
	</p>
	</div>
	{#if !localStream}
	<Button
	variant="default"
	size="sm"
	onclick={handleConnectLocalCamera}
	disabled={isConnecting}
	class="bg-green-600 text-xs hover:bg-green-700 disabled:opacity-50"
	>
	{#if isConnecting}
	<span class="icon-[mdi--loading] mr-1 size-3 animate-spin"></span>
	Connecting...
	{:else}
	<span class="icon-[mdi--camera] mr-1 size-3"></span>
	Connect Camera
	{/if}
	</Button>
	{:else}
	<Button
	variant="destructive"
	size="sm"
	onclick={handleDisconnectCamera}
	class="text-xs"
	>
	<span class="icon-[mdi--close-circle] mr-1 size-3"></span>
	Disconnect
	</Button>
	{/if}
	</div>
	</div>

	<!-- Live Preview -->
	{#if localStream}
	<div class="space-y-2">
	<div class="text-sm font-medium text-green-300">Live Preview:</div>
	<div
	class="aspect-video overflow-hidden rounded border border-green-500/30 bg-black/50"
	>
	<video
	autoplay
	muted
	playsinline
	class="h-full w-full object-cover"
	onloadedmetadata={(e) => {
	const video = e.target as HTMLVideoElement;
	video.srcObject = localStream;
	}}
	></video>
	</div>
	</div>
	{/if}
	</Card.Content>
	</Card.Root>

	<!-- Session Camera Details -->
	<Card.Root class="border-blue-500/30 bg-blue-500/5">
	<Card.Header>
	<Card.Title class="flex items-center gap-2 text-base text-blue-200">
	<span class="icon-[mdi--information] size-4"></span>
	Session Camera Details
	</Card.Title>
	</Card.Header>
	<Card.Content>
	<div class="space-y-2 text-xs">
	{#each Object.entries(compute.sessionData?.camera_room_ids \|\| {}) as [camera, roomId]}
	<div class="flex items-center justify-between rounded bg-slate-800/50 p-2">
	<span class="font-medium text-blue-300">{camera}</span>
	<span class="font-mono text-blue-200">{roomId}</span>
	</div>
	{/each}
	</div>
	</Card.Content>
	</Card.Root>
	{/if}

	<!-- Quick Info -->
	<div class="rounded border border-slate-700 bg-slate-800/30 p-2 text-xs text-slate-500">
	<span class="icon-[mdi--information] mr-1 size-3"></span>
	Video inputs stream camera data to the AI model for visual processing. Each camera connects to
	a dedicated room in the session.
	</div>
	</div>
	</Dialog.Content>
	</Dialog.Root>