Major UI overhaul plans; Other random docs

2026-02-15 00:43:41 -05:00
parent 1b86f66954
commit ef829f06a4
17 changed files with 5533 additions and 553 deletions
--- a/.agent/skills/speech-to-text/references/realtime-client-side.md
+++ b/.agent/skills/speech-to-text/references/realtime-client-side.md
@@ -0,0 +1,169 @@
+# Client-Side Real-Time Streaming
+
+Stream audio from the browser directly to ElevenLabs for real-time transcription.
+
+## Installation
+
+```bash
+# React
+npm install @elevenlabs/react @elevenlabs/elevenlabs-js
+
+# JavaScript
+npm install @elevenlabs/client @elevenlabs/elevenlabs-js
+```
+
+> **Warning:** Always install client-side packages from the `@elevenlabs/*` npm scope.
+
+## Token Generation
+
+Client-side streaming authenticates with a single-use token so that your API key never has to be sent to the browser. Generate tokens on your backend:
+
+```typescript
+import { ElevenLabsClient } from "@elevenlabs/elevenlabs-js";
+
+const elevenlabs = new ElevenLabsClient({
+  apiKey: process.env.ELEVENLABS_API_KEY,
+});
+
+app.get("/scribe-token", yourAuthMiddleware, async (req, res) => {
+  const token = await elevenlabs.tokens.singleUse.create("realtime_scribe");
+  res.json(token);
+});
+```
+
+**Note:** Single-use tokens expire after 15 minutes, so request a fresh token right before each connection instead of caching one.
+
+## React Implementation
+
+```typescript
+import { useState } from "react";
+import { useScribe } from "@elevenlabs/react";
+function TranscriptionComponent() {
+  const [transcript, setTranscript] = useState("");
+
+  const scribe = useScribe({
+    modelId: "scribe_v2_realtime",
+    onPartialTranscript: (data) => {
+      // Show live feedback as user speaks
+      console.log("Partial:", data.text);
+    },
+    onCommittedTranscript: (data) => {
+      // Final transcript for this segment
+      setTranscript((prev) => prev + data.text);
+    },
+  });
+
+  const startRecording = async () => {
+    const tokenResponse = await fetch("/scribe-token");
+    const { token } = await tokenResponse.json();
+
+    await scribe.connect({
+      token,
+      microphone: {
+        echoCancellation: true,
+        noiseSuppression: true,
+        autoGainControl: true,
+      },
+    });
+  };
+
+  const stopRecording = () => {
+    scribe.disconnect();
+  };
+
+  return (
+    <div>
+      <div>Status: {scribe.status}</div>
+      <button onClick={startRecording}>Start</button>
+      <button onClick={stopRecording}>Stop</button>
+      <p>{transcript}</p>
+    </div>
+  );
+}
+```
+
+## JavaScript Implementation
+
+```typescript
+import { Scribe, RealtimeEvents } from "@elevenlabs/client";
+
+async function startTranscription() {
+  const tokenResponse = await fetch("/scribe-token");
+  const { token } = await tokenResponse.json();
+
+  const connection = Scribe.connect({
+    token,
+    modelId: "scribe_v2_realtime",
+    includeTimestamps: true,
+    microphone: {
+      echoCancellation: true,
+      noiseSuppression: true,
+      autoGainControl: true,
+    },
+  });
+
+  connection.on(RealtimeEvents.OPEN, () => {
+    console.log("Connected");
+  });
+
+  connection.on(RealtimeEvents.PARTIAL_TRANSCRIPT, (data) => {
+    console.log("Partial:", data.text);
+  });
+
+  connection.on(RealtimeEvents.COMMITTED_TRANSCRIPT, (data) => {
+    console.log("Committed:", data.text);
+  });
+
+  connection.on(RealtimeEvents.COMMITTED_TRANSCRIPT_WITH_TIMESTAMPS, (data) => {
+    for (const word of data.words) {
+      console.log(`${word.text}: ${word.start}s - ${word.end}s`);
+    }
+  });
+
+  connection.on(RealtimeEvents.ERROR, (error) => {
+    console.error("Error:", error);
+  });
+
+  connection.on(RealtimeEvents.CLOSE, () => {
+    console.log("Disconnected");
+  });
+
+  return connection;
+}
+```
+
+## Manual Audio Chunking
+
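+For file uploads or custom audio sources, encode the audio as 16-bit PCM and send it in base64-encoded chunks (here `pcmData` is a typed array of samples and `scribe` is the connected transcription instance):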
+
+```typescript
+const chunkSize = 4096;
+
+for (let offset = 0; offset < pcmData.length; offset += chunkSize) {
+  const chunk = pcmData.slice(offset, offset + chunkSize);
+  const bytes = new Uint8Array(chunk.buffer);
+  const base64 = btoa(String.fromCharCode(...bytes));
+
+  scribe.sendAudio(base64);
+
+  // Simulate real-time streaming
+  await new Promise((resolve) => setTimeout(resolve, 50));
+}
+
+// Finalize transcription
+scribe.commit();
+```
+
+## Microphone Options
+
+| Option | Description |
+|--------|-------------|
+| `echoCancellation` | Remove speaker echo picked up by the microphone |
+| `noiseSuppression` | Filter background noise |
+| `autoGainControl` | Normalize volume levels |
+
+## Security
+
+- Never expose your API key to the client
+- Always generate single-use tokens on your backend
+- Use authentication middleware to protect token endpoints