RobotHub-Frontend / src /lib /components /3d /elements /compute /modal /VideoInputConnectionModal.svelte
blanchon's picture
Update
3cdf7b9
<script lang="ts">
import * as Dialog from "@/components/ui/dialog";
import { video } from "@robothub/transport-server-client";
import type { video as videoTypes } from "@robothub/transport-server-client";
import { Button } from "@/components/ui/button";
import * as Card from "@/components/ui/card";
import { Badge } from "@/components/ui/badge";
import { toast } from "svelte-sonner";
import { settings } from "$lib/runes/settings.svelte";
import { videoManager } from "$lib/elements/video/VideoManager.svelte";
import type { RemoteCompute } from "$lib/elements/compute//RemoteCompute.svelte";
/** Props accepted by the video-input connection modal. */
interface Props {
	/** Two-way bound visibility flag forwarded to the dialog root. */
	open: boolean;
	/** Workspace passed to the room refresh and to the video producer connection. */
	workspaceId: string;
	/** Remote compute whose session data supplies the camera names and room IDs. */
	compute: RemoteCompute;
}
// `open` is bindable so both the parent and the dialog itself can toggle it.
let { workspaceId, compute, open = $bindable() }: Props = $props();

// True while a connection attempt is in flight (drives the button spinner).
let isConnecting = $state(false);
// Name of the session camera input the local camera will be streamed to.
let selectedCameraName = $state("front");
// Local camera stream; the template treats a non-null value as "connected".
let localStream = $state<MediaStream | null>(null);
// Active video producer, kept as a plain (non-reactive) variable.
// NOTE(review): typed `any`; the otherwise unused `videoTypes` import suggests a
// concrete producer type was intended here — confirm and tighten.
let videoProducer: any = null;
// Each time the modal is open (or the workspace changes while it is open),
// ask the video manager to refresh the workspace's room list.
$effect(() => {
	if (!open) return;
	videoManager.refreshRooms(workspaceId);
});
/**
 * Connects the user's local camera to the room of the currently selected session camera.
 *
 * Steps: verify that the compute has a session, resolve the room ID for the selected
 * camera, open the local camera, join the existing room as a video producer and start
 * streaming. Component state (`localStream`, `videoProducer`) is only updated once
 * every step has succeeded; if any step fails, the camera stream and producer acquired
 * so far are released so the webcam is not left running while the UI reports an error.
 *
 * Failures are reported through a toast and the console; nothing is thrown to the caller.
 */
async function handleConnectLocalCamera() {
	if (!compute.hasSession) {
		toast.error("No Inference Session available. Create a session first.");
		return;
	}

	// Snapshot the selection so every step refers to the same camera even if the
	// user picks another one while the awaits below are pending.
	const cameraName = selectedCameraName;
	let stream: MediaStream | null = null;
	let producer: InstanceType<typeof video.VideoProducer> | null = null;

	isConnecting = true;
	try {
		// Resolve the room before touching the camera, so a missing room fails
		// without prompting for camera permission or opening the device.
		const cameraRoomId = compute.sessionData?.camera_room_ids[cameraName];
		if (!cameraRoomId) {
			throw new Error(`No room found for camera: ${cameraName}`);
		}

		// Get user media (video only)
		stream = await navigator.mediaDevices.getUserMedia({
			video: true,
			audio: false
		});

		// Connect to the EXISTING camera room (don't create new one)
		producer = new video.VideoProducer(settings.transportServerUrl);
		const participantId = `frontend-camera-${cameraName}-${Date.now()}`;
		const success = await producer.connect(workspaceId, cameraRoomId, participantId);
		if (!success) {
			throw new Error("Failed to connect to camera room");
		}

		// Start streaming
		await producer.startCamera();

		// Publish state only now, so the UI never shows "Connected" for a
		// connection that later fails.
		videoProducer = producer;
		localStream = stream;

		toast.success(`Camera connected to Inference Session`, {
			description: `Local camera streaming to ${cameraName} input`
		});
	} catch (error) {
		console.error("Camera connection error:", error);

		// Roll back whatever was acquired before the failure.
		stream?.getTracks().forEach((track) => track.stop());
		const failedProducer = producer;
		if (failedProducer) {
			const releaseSteps = [
				() => failedProducer.stopStreaming(),
				() => failedProducer.disconnect()
			];
			for (const release of releaseSteps) {
				try {
					await release();
				} catch (cleanupError) {
					// Best effort: the original error is the one worth reporting.
					console.error("Camera cleanup error:", cleanupError);
				}
			}
		}

		toast.error("Failed to connect camera", {
			description: error instanceof Error ? error.message : "Unknown error"
		});
	} finally {
		isConnecting = false;
	}
}
/**
 * Stops streaming, disconnects the video producer and releases the local camera.
 *
 * Component state is detached up front and every release step runs even when an
 * earlier one throws, so a transport error cannot leave the webcam capturing or a
 * stale producer/stream referenced by the component.
 *
 * Shows a success toast when all steps complete and an error toast otherwise;
 * nothing is thrown to the caller.
 */
async function handleDisconnectCamera() {
	// Take ownership of the current resources and clear the shared state first,
	// so a second call while this one is pending finds nothing left to release.
	const producer = videoProducer;
	const stream = localStream;
	videoProducer = null;
	localStream = null;

	try {
		try {
			if (producer) {
				try {
					await producer.stopStreaming();
				} finally {
					// Disconnect even if stopping the stream failed.
					await producer.disconnect();
				}
			}
		} finally {
			// Always stop the local tracks, even if the producer teardown threw.
			stream?.getTracks().forEach((track) => track.stop());
		}
		toast.success("Camera disconnected");
	} catch (error) {
		console.error("Disconnect error:", error);
		toast.error("Error disconnecting camera");
	}
}
// Cleanup on modal close or component destroy.
// The effect body reads `open`, so it re-runs whenever `open` changes. While the
// modal is open it registers a teardown; that teardown runs when `open` flips to
// false (before the re-run) and when the component is destroyed while still open.
$effect(() => {
	if (!open) return;
	return () => {
		// Skip the call (and its success toast) when nothing is connected.
		if (videoProducer || localStream) {
			void handleDisconnectCamera();
		}
	};
});
</script>
<!-- Modal for connecting a local camera to one of the session's camera inputs -->
<Dialog.Root bind:open>
	<Dialog.Content
		class="max-h-[80vh] max-w-xl overflow-y-auto border-slate-600 bg-slate-900 text-slate-100"
	>
		<Dialog.Header class="pb-3">
			<Dialog.Title class="flex items-center gap-2 text-lg font-bold text-slate-100">
				<span class="icon-[mdi--video-input-component] size-5 text-green-400"></span>
				Video Input - {compute.name || "No Compute Selected"}
			</Dialog.Title>
			<Dialog.Description class="text-sm text-slate-400">
				Connect camera streams to provide visual input for AI inference
			</Dialog.Description>
		</Dialog.Header>
		<div class="space-y-4">
			<!-- Inference Session Status -->
			<div
				class="flex items-center justify-between rounded-lg border border-purple-500/30 bg-purple-900/20 p-3"
			>
				<div class="flex items-center gap-2">
					<span class="icon-[mdi--brain] size-4 text-purple-400"></span>
					<span class="text-sm font-medium text-purple-300">Inference Session</span>
				</div>
				{#if compute.hasSession}
					<Badge variant="default" class="bg-purple-600 text-xs">
						{compute.statusInfo.statusText}
					</Badge>
				{:else}
					<Badge variant="secondary" class="text-xs text-slate-400">No Session</Badge>
				{/if}
			</div>
			{#if !compute.hasSession}
				<!-- Without a session there are no camera rooms to connect to -->
				<Card.Root class="border-yellow-500/30 bg-yellow-500/5">
					<Card.Header>
						<Card.Title class="flex items-center gap-2 text-base text-yellow-200">
							<span class="icon-[mdi--alert] size-4"></span>
							Inference Session Required
						</Card.Title>
					</Card.Header>
					<Card.Content class="text-sm text-yellow-300">
						You need to create an Inference Session before connecting video inputs. The session
						defines which camera names are available for connection.
					</Card.Content>
				</Card.Root>
			{:else}
				<!-- Camera Selection and Connection -->
				<Card.Root class="border-green-500/30 bg-green-500/5">
					<Card.Header>
						<Card.Title class="flex items-center gap-2 text-base text-green-200">
							<span class="icon-[mdi--camera] size-4"></span>
							Camera Connection
						</Card.Title>
					</Card.Header>
					<Card.Content class="space-y-4">
						<!-- Available Cameras -->
						<div class="space-y-2">
							<div class="text-sm font-medium text-green-300">Available Camera Inputs:</div>
							<div class="grid grid-cols-2 gap-2">
								{#each compute.sessionConfig?.cameraNames ?? [] as cameraName}
									<button
										type="button"
										onclick={() => (selectedCameraName = cameraName)}
										class="rounded border p-2 text-left {selectedCameraName === cameraName
											? 'border-green-500 bg-green-500/20'
											: 'border-slate-600 bg-slate-800/50 hover:bg-slate-700/50'}"
									>
										<div class="text-sm font-medium">{cameraName}</div>
										<div class="text-xs text-slate-400">
											Room: {compute.sessionData?.camera_room_ids[cameraName]?.slice(-8)}
										</div>
									</button>
								{/each}
							</div>
						</div>
						<!-- Connection Status -->
						<div class="rounded-lg border border-green-500/30 bg-green-900/20 p-3">
							<div class="flex items-center justify-between">
								<div>
									<p class="text-sm font-medium text-green-300">
										Selected Camera: {selectedCameraName}
									</p>
									<p class="text-xs text-green-400/70">
										{localStream ? "Connected" : "Not Connected"}
									</p>
								</div>
								{#if !localStream}
									<Button
										variant="default"
										size="sm"
										onclick={handleConnectLocalCamera}
										disabled={isConnecting}
										class="bg-green-600 text-xs hover:bg-green-700 disabled:opacity-50"
									>
										{#if isConnecting}
											<span class="icon-[mdi--loading] mr-1 size-3 animate-spin"></span>
											Connecting...
										{:else}
											<span class="icon-[mdi--camera] mr-1 size-3"></span>
											Connect Camera
										{/if}
									</Button>
								{:else}
									<Button
										variant="destructive"
										size="sm"
										onclick={handleDisconnectCamera}
										class="text-xs"
									>
										<span class="icon-[mdi--close-circle] mr-1 size-3"></span>
										Disconnect
									</Button>
								{/if}
							</div>
						</div>
						<!-- Live Preview -->
						{#if localStream}
							<div class="space-y-2">
								<div class="text-sm font-medium text-green-300">Live Preview:</div>
								<div
									class="aspect-video overflow-hidden rounded border border-green-500/30 bg-black/50"
								>
									<!--
										Bind the stream directly. A video element without a source never
										fires `loadedmetadata`, so assigning `srcObject` from that handler
										would never run and the preview would stay blank.
									-->
									<video
										autoplay
										muted
										playsinline
										class="h-full w-full object-cover"
										srcObject={localStream}
									></video>
								</div>
							</div>
						{/if}
					</Card.Content>
				</Card.Root>
				<!-- Session Camera Details -->
				<Card.Root class="border-blue-500/30 bg-blue-500/5">
					<Card.Header>
						<Card.Title class="flex items-center gap-2 text-base text-blue-200">
							<span class="icon-[mdi--information] size-4"></span>
							Session Camera Details
						</Card.Title>
					</Card.Header>
					<Card.Content>
						<div class="space-y-2 text-xs">
							{#each Object.entries(compute.sessionData?.camera_room_ids ?? {}) as [camera, roomId]}
								<div class="flex items-center justify-between rounded bg-slate-800/50 p-2">
									<span class="font-medium text-blue-300">{camera}</span>
									<span class="font-mono text-blue-200">{roomId}</span>
								</div>
							{/each}
						</div>
					</Card.Content>
				</Card.Root>
			{/if}
			<!-- Quick Info -->
			<div class="rounded border border-slate-700 bg-slate-800/30 p-2 text-xs text-slate-500">
				<span class="icon-[mdi--information] mr-1 size-3"></span>
				Video inputs stream camera data to the AI model for visual processing. Each camera connects to
				a dedicated room in the session.
			</div>
		</div>
	</Dialog.Content>
</Dialog.Root>