Compare commits
13 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
| 054e4057d8 | |||
| 3943e79bb1 | |||
| 87f4317c15 | |||
| 50aa793910 | |||
| 5efc9865a8 | |||
| 949c573c49 | |||
| f7f450a09d | |||
| 81f7c38383 | |||
| 2c785cb37a | |||
| 57e65b061c | |||
| aa54765b03 | |||
| 8929bc99bb | |||
| 0428c06612 |
+37
-7
@@ -1,20 +1,50 @@
|
|||||||
# ARIA Environment Configuration
|
# ════════════════════════════════════════════════
|
||||||
# Copy to .env and fill in values
|
# ARIA — Umgebungsvariablen
|
||||||
|
# Kopieren nach .env und Werte eintragen
|
||||||
|
# ════════════════════════════════════════════════
|
||||||
|
|
||||||
# Auth token for ARIA Core (generate a long random string)
|
# ── ARIA Auth Token ──────────────────────────────
|
||||||
# openssl rand -hex 32
|
# Authentifizierung fuer den OpenClaw Gateway (aria-core).
|
||||||
|
# Wird von Diagnostic, Bridge und App genutzt um sich am Gateway anzumelden.
|
||||||
|
# Alle Services die mit aria-core kommunizieren brauchen diesen Token.
|
||||||
|
# Generieren: openssl rand -hex 32
|
||||||
ARIA_AUTH_TOKEN=change-me-to-a-long-random-string
|
ARIA_AUTH_TOKEN=change-me-to-a-long-random-string
|
||||||
|
|
||||||
# RVS — Rendezvous-Server (Bridge + App verbinden sich hierüber)
|
# ── RVS — Rendezvous-Server ─────────────────────
|
||||||
|
# Der RVS ist ein WebSocket-Relay im Rechenzentrum.
|
||||||
|
# App, Bridge, Diagnostic und XTTS-Bridge verbinden sich hierueber.
|
||||||
|
# Alle muessen den gleichen Host, Port und Token nutzen.
|
||||||
|
|
||||||
|
# Hostname des RVS-Servers (z.B. rvs.example.de oder mobil.hacker-net.de)
|
||||||
RVS_HOST=rvs.example.de
|
RVS_HOST=rvs.example.de
|
||||||
|
|
||||||
|
# Port auf dem der RVS laeuft (muss mit rvs/docker-compose.yml uebereinstimmen)
|
||||||
RVS_PORT=443
|
RVS_PORT=443
|
||||||
|
|
||||||
|
# TLS (wss://) verwenden? true = verschluesselt, false = unverschluesselt (ws://)
|
||||||
RVS_TLS=true
|
RVS_TLS=true
|
||||||
|
|
||||||
# Bei TLS-Fehler automatisch auf ws:// (ohne TLS) fallback?
|
# Bei TLS-Fehler automatisch auf ws:// (ohne TLS) fallback?
|
||||||
# true = Fallback erlaubt, false = nur mit TLS verbinden
|
# Nuetzlich wenn kein TLS-Zertifikat vorhanden (z.B. Entwicklung)
|
||||||
RVS_TLS_FALLBACK=true
|
RVS_TLS_FALLBACK=true
|
||||||
|
|
||||||
|
# Pairing-Token: Wer den gleichen Token hat, landet im gleichen RVS-Room.
|
||||||
|
# Wird von generate-token.sh automatisch generiert und hier eingetragen.
|
||||||
|
# Die Android App bekommt den Token per QR-Code beim Pairing.
|
||||||
|
# WICHTIG: Muss auf ARIA-VM, Gaming-PC (xtts/.env) und App identisch sein!
|
||||||
|
# Generieren: ./generate-token.sh (traegt den Token automatisch ein)
|
||||||
RVS_TOKEN=
|
RVS_TOKEN=
|
||||||
|
|
||||||
# Gitea (for release.sh — Kennwort wird interaktiv abgefragt)
|
# ── Gitea — Release-Verwaltung ───────────────────
|
||||||
|
# Wird von release.sh genutzt um APKs auf Gitea zu veroeffentlichen.
|
||||||
|
# Kennwort wird beim Release interaktiv abgefragt (nicht in .env!).
|
||||||
GITEA_URL=https://git.hacker-net.de
|
GITEA_URL=https://git.hacker-net.de
|
||||||
GITEA_REPO=Hacker-Software/ARIA-AGENT
|
GITEA_REPO=Hacker-Software/ARIA-AGENT
|
||||||
GITEA_USER=duffyduck
|
GITEA_USER=duffyduck
|
||||||
|
|
||||||
|
# ── Auto-Update — APK auf RVS-Server kopieren ───
|
||||||
|
# SSH-Ziel fuer scp: release.sh kopiert die APK dorthin.
|
||||||
|
# Der RVS-Server stellt sie dann per WebSocket an die App bereit.
|
||||||
|
# Format: user@host (z.B. root@aria-rvs oder root@rvs.example.de)
|
||||||
|
# Leer lassen = Auto-Update ueberspringen, APK manuell auf RVS kopieren.
|
||||||
|
RVS_UPDATE_HOST=
|
||||||
|
|||||||
@@ -103,16 +103,31 @@ cd ~/ARIA-AGENT
|
|||||||
cp .env.example .env
|
cp .env.example .env
|
||||||
```
|
```
|
||||||
|
|
||||||
`.env` Datei editieren:
|
`.env` Datei editieren (Details siehe `.env.example`):
|
||||||
```bash
|
```bash
|
||||||
|
# Gateway-Auth: Alle Services die mit aria-core reden brauchen diesen Token
|
||||||
|
# Diagnostic, Bridge, App nutzen ihn fuer den WebSocket-Handshake
|
||||||
ARIA_AUTH_TOKEN= # openssl rand -hex 32
|
ARIA_AUTH_TOKEN= # openssl rand -hex 32
|
||||||
|
|
||||||
|
# RVS-Verbindung: Hostname + Port deines Rendezvous-Servers
|
||||||
RVS_HOST= # z.B. rvs.hackersoft.de
|
RVS_HOST= # z.B. rvs.hackersoft.de
|
||||||
RVS_PORT=443
|
RVS_PORT=443
|
||||||
RVS_TLS=true
|
RVS_TLS=true
|
||||||
RVS_TLS_FALLBACK=true
|
RVS_TLS_FALLBACK=true
|
||||||
RVS_TOKEN= # wird von generate-token.sh automatisch gesetzt
|
|
||||||
|
# Pairing-Token: Verbindet App, Bridge, Diagnostic und XTTS im gleichen RVS-Room
|
||||||
|
# MUSS auf allen Geraeten identisch sein (ARIA-VM, Gaming-PC, App)
|
||||||
|
# Wird von generate-token.sh automatisch generiert und eingetragen
|
||||||
|
RVS_TOKEN= # ./generate-token.sh
|
||||||
|
|
||||||
|
# Optional: SSH-Host des RVS-Servers fuer Auto-Update (z.B. root@aria-rvs)
|
||||||
|
RVS_UPDATE_HOST=
|
||||||
```
|
```
|
||||||
|
|
||||||
|
**Zwei Tokens, zwei Zwecke:**
|
||||||
|
- **ARIA_AUTH_TOKEN**: Authentifizierung am OpenClaw Gateway (aria-core). Wer diesen Token hat, kann ARIA Befehle geben.
|
||||||
|
- **RVS_TOKEN**: Pairing-Token fuer den Rendezvous-Server. Alle Geraete mit dem gleichen Token landen im gleichen "Room" und koennen kommunizieren. Die App bekommt diesen Token per QR-Code.
|
||||||
|
|
||||||
### 2. Claude CLI einloggen (Proxy-Auth)
|
### 2. Claude CLI einloggen (Proxy-Auth)
|
||||||
|
|
||||||
Der Proxy-Container nutzt deine Claude Max Subscription. Die Credentials muessen
|
Der Proxy-Container nutzt deine Claude Max Subscription. Die Credentials muessen
|
||||||
|
|||||||
@@ -79,8 +79,8 @@ android {
|
|||||||
applicationId "com.ariacockpit"
|
applicationId "com.ariacockpit"
|
||||||
minSdkVersion rootProject.ext.minSdkVersion
|
minSdkVersion rootProject.ext.minSdkVersion
|
||||||
targetSdkVersion rootProject.ext.targetSdkVersion
|
targetSdkVersion rootProject.ext.targetSdkVersion
|
||||||
versionCode 206
|
versionCode 208
|
||||||
versionName "0.0.2.6"
|
versionName "0.0.2.8"
|
||||||
// Fallback fuer Libraries mit Product Flavors
|
// Fallback fuer Libraries mit Product Flavors
|
||||||
missingDimensionStrategy 'react-native-camera', 'general'
|
missingDimensionStrategy 'react-native-camera', 'general'
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -1,6 +1,6 @@
|
|||||||
{
|
{
|
||||||
"name": "aria-cockpit",
|
"name": "aria-cockpit",
|
||||||
"version": "0.0.2.6",
|
"version": "0.0.2.8",
|
||||||
"private": true,
|
"private": true,
|
||||||
"scripts": {
|
"scripts": {
|
||||||
"android": "react-native run-android",
|
"android": "react-native run-android",
|
||||||
|
|||||||
@@ -748,7 +748,7 @@ const SettingsScreen: React.FC = () => {
|
|||||||
<Text style={styles.sectionTitle}>{'\u00DC'}ber</Text>
|
<Text style={styles.sectionTitle}>{'\u00DC'}ber</Text>
|
||||||
<View style={styles.card}>
|
<View style={styles.card}>
|
||||||
<Text style={styles.aboutTitle}>ARIA Cockpit</Text>
|
<Text style={styles.aboutTitle}>ARIA Cockpit</Text>
|
||||||
<Text style={styles.aboutVersion}>Version 0.0.2.6 </Text>
|
<Text style={styles.aboutVersion}>Version 0.0.2.8 </Text>
|
||||||
<Text style={styles.aboutInfo}>
|
<Text style={styles.aboutInfo}>
|
||||||
Stefans Kommandozentrale f{'\u00FC'}r ARIA.{'\n'}
|
Stefans Kommandozentrale f{'\u00FC'}r ARIA.{'\n'}
|
||||||
Gebaut mit React Native + TypeScript.
|
Gebaut mit React Native + TypeScript.
|
||||||
|
|||||||
@@ -58,6 +58,8 @@ class AudioService {
|
|||||||
// Audio-Queue fuer sequentielle TTS-Wiedergabe
|
// Audio-Queue fuer sequentielle TTS-Wiedergabe
|
||||||
private audioQueue: string[] = [];
|
private audioQueue: string[] = [];
|
||||||
private isPlaying: boolean = false;
|
private isPlaying: boolean = false;
|
||||||
|
private preloadedSound: Sound | null = null;
|
||||||
|
private preloadedPath: string = '';
|
||||||
|
|
||||||
// VAD State
|
// VAD State
|
||||||
private vadEnabled: boolean = false;
|
private vadEnabled: boolean = false;
|
||||||
@@ -220,35 +222,62 @@ class AudioService {
|
|||||||
}
|
}
|
||||||
|
|
||||||
this.isPlaying = true;
|
this.isPlaying = true;
|
||||||
const base64Data = this.audioQueue.shift()!;
|
|
||||||
|
|
||||||
try {
|
// Preloaded Sound verwenden wenn verfuegbar, sonst neu laden
|
||||||
const tmpPath = `${RNFS.CachesDirectoryPath}/aria_tts_${Date.now()}.wav`;
|
let sound: Sound;
|
||||||
await RNFS.writeFile(tmpPath, base64Data, 'base64');
|
let soundPath: string;
|
||||||
|
|
||||||
this.currentSound = new Sound(tmpPath, '', (error) => {
|
if (this.preloadedSound) {
|
||||||
if (error) {
|
sound = this.preloadedSound;
|
||||||
console.error('[Audio] Fehler beim Laden:', error);
|
soundPath = this.preloadedPath;
|
||||||
RNFS.unlink(tmpPath).catch(() => {});
|
this.preloadedSound = null;
|
||||||
this._playNext();
|
this.preloadedPath = '';
|
||||||
return;
|
// Daten aus Queue entfernen (wurde schon preloaded)
|
||||||
}
|
this.audioQueue.shift();
|
||||||
this.currentSound?.play((success) => {
|
} else {
|
||||||
if (success) {
|
const base64Data = this.audioQueue.shift()!;
|
||||||
console.log('[Audio] Wiedergabe abgeschlossen');
|
try {
|
||||||
} else {
|
soundPath = `${RNFS.CachesDirectoryPath}/aria_tts_${Date.now()}.wav`;
|
||||||
console.warn('[Audio] Wiedergabe fehlgeschlagen');
|
await RNFS.writeFile(soundPath, base64Data, 'base64');
|
||||||
}
|
sound = await new Promise<Sound>((resolve, reject) => {
|
||||||
this.currentSound?.release();
|
const s = new Sound(soundPath, '', (err) => err ? reject(err) : resolve(s));
|
||||||
this.currentSound = null;
|
|
||||||
RNFS.unlink(tmpPath).catch(() => {});
|
|
||||||
// Naechstes Audio abspielen
|
|
||||||
this._playNext();
|
|
||||||
});
|
});
|
||||||
});
|
} catch (err) {
|
||||||
} catch (err) {
|
console.error('[Audio] Laden fehlgeschlagen:', err);
|
||||||
console.error('[Audio] Wiedergabefehler:', err);
|
this._playNext();
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
this.currentSound = sound;
|
||||||
|
|
||||||
|
// Naechstes Audio schon vorbereiten waehrend dieses abspielt
|
||||||
|
this._preloadNext();
|
||||||
|
|
||||||
|
sound.play((success) => {
|
||||||
|
if (!success) console.warn('[Audio] Wiedergabe fehlgeschlagen');
|
||||||
|
sound.release();
|
||||||
|
this.currentSound = null;
|
||||||
|
RNFS.unlink(soundPath).catch(() => {});
|
||||||
this._playNext();
|
this._playNext();
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
/** Naechstes Audio im Hintergrund vorladen (verhindert Stottern) */
|
||||||
|
private async _preloadNext(): Promise<void> {
|
||||||
|
if (this.audioQueue.length === 0 || this.preloadedSound) return;
|
||||||
|
|
||||||
|
const base64Data = this.audioQueue[0]; // Nicht shift — bleibt in Queue
|
||||||
|
try {
|
||||||
|
const tmpPath = `${RNFS.CachesDirectoryPath}/aria_tts_pre_${Date.now()}.wav`;
|
||||||
|
await RNFS.writeFile(tmpPath, base64Data, 'base64');
|
||||||
|
this.preloadedSound = await new Promise<Sound>((resolve, reject) => {
|
||||||
|
const s = new Sound(tmpPath, '', (err) => err ? reject(err) : resolve(s));
|
||||||
|
});
|
||||||
|
this.preloadedPath = tmpPath;
|
||||||
|
} catch {
|
||||||
|
this.preloadedSound = null;
|
||||||
|
this.preloadedPath = '';
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -261,6 +290,12 @@ class AudioService {
|
|||||||
this.currentSound.release();
|
this.currentSound.release();
|
||||||
this.currentSound = null;
|
this.currentSound = null;
|
||||||
}
|
}
|
||||||
|
if (this.preloadedSound) {
|
||||||
|
this.preloadedSound.release();
|
||||||
|
this.preloadedSound = null;
|
||||||
|
if (this.preloadedPath) RNFS.unlink(this.preloadedPath).catch(() => {});
|
||||||
|
this.preloadedPath = '';
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// --- Status & Callbacks ---
|
// --- Status & Callbacks ---
|
||||||
|
|||||||
+1
-1
@@ -18,7 +18,7 @@ services:
|
|||||||
claude-max-api"
|
claude-max-api"
|
||||||
volumes:
|
volumes:
|
||||||
- ~/.claude:/root/.claude # Claude CLI Auth (Credentials in /root/.claude/.credentials.json)
|
- ~/.claude:/root/.claude # Claude CLI Auth (Credentials in /root/.claude/.credentials.json)
|
||||||
- ./aria-data/ssh:/root/.ssh:ro # SSH Keys fuer VM-Zugriff (aria-wohnung)
|
- ./aria-data/ssh:/root/.ssh # SSH Keys fuer VM-Zugriff (aria-wohnung, rw fuer ARIA)
|
||||||
- aria-shared:/shared # Shared Volume fuer Datei-Austausch (Uploads von App)
|
- aria-shared:/shared # Shared Volume fuer Datei-Austausch (Uploads von App)
|
||||||
environment:
|
environment:
|
||||||
- HOST=0.0.0.0
|
- HOST=0.0.0.0
|
||||||
|
|||||||
@@ -18,19 +18,35 @@
|
|||||||
- [x] RVS Nachrichten vom Smartphone gehen durch
|
- [x] RVS Nachrichten vom Smartphone gehen durch
|
||||||
- [x] Stimmen-Einstellungen (Ramona/Thorsten, Speed pro Stimme)
|
- [x] Stimmen-Einstellungen (Ramona/Thorsten, Speed pro Stimme)
|
||||||
- [x] Highlight-Trigger konfigurierbar in Diagnostic
|
- [x] Highlight-Trigger konfigurierbar in Diagnostic
|
||||||
|
- [x] XTTS v2 Integration (Gaming-PC, GPU, Voice Cloning)
|
||||||
|
- [x] XTTS Voice Cloning (Audio-Samples hochladen, eigene Stimme)
|
||||||
|
- [x] TTS Engine waehlbar (Piper/XTTS) in Diagnostic + App
|
||||||
|
- [x] Auto-Update System (APK via RVS WebSocket)
|
||||||
|
- [x] Audio-Queue (sequentielle Wiedergabe, kein Ueberlappen)
|
||||||
|
|
||||||
## Offen
|
## Offen
|
||||||
|
|
||||||
### TTS / Stimmen
|
### Bugs (Prioritaet)
|
||||||
- [ ] TTS Engine waehlbar: Piper (CPU, schnell) oder Coqui XTTS v2 (GPU, natuerlicher)
|
- [ ] Session-Persistenz: Bei Container-Restart wird immer aria-bridge geladen statt die zuletzt gewaehlte Session. Wird nicht persistent gespeichert.
|
||||||
- [ ] Piper Voices Download ueber Diagnostic (neue Sprachen/Stimmen)
|
- [ ] App: Textnachrichten, Bilder und Anhaenge werden von ARIA nicht beantwortet — nur Sprachnachrichten funktionieren.
|
||||||
- [ ] Coqui XTTS v2 Integration (braucht GPU, bessere deutsche Stimme)
|
- [ ] App: Audioausgabe hoert ab und zu einfach auf (mitten im Satz oder zwischen Chunks)
|
||||||
|
- [ ] Auto-Update: release.sh kopiert APK nicht auf den RVS-Server (rvs/updates/ bleibt leer)
|
||||||
|
- [ ] App: Kein Auto-Scroll zur letzten Nachricht beim App-Start (soll direkt springen, nicht animiert scrollen)
|
||||||
|
- [ ] App: Bei neuen Nachrichten soll automatisch zur letzten Nachricht gescrollt werden
|
||||||
|
|
||||||
### App
|
### App Features
|
||||||
|
- [ ] App: Zu Anhaengen noch Text/Sprache hinzufuegen koennen (z.B. Bild senden + "Was siehst du?")
|
||||||
- [ ] Wake Word on-device (Porcupine "ARIA" Keyword, Phase 2)
|
- [ ] Wake Word on-device (Porcupine "ARIA" Keyword, Phase 2)
|
||||||
- [ ] Chat-History zuverlaessiger laden (AsyncStorage Race Condition)
|
- [ ] Chat-History zuverlaessiger laden (AsyncStorage Race Condition)
|
||||||
|
- [ ] Background Audio Service (TTS auch bei minimierter App)
|
||||||
|
|
||||||
|
### TTS / Audio
|
||||||
|
- [ ] XTTS Audio-Streaming verbessern (minimales Stottern bei Chunk-Uebergaengen)
|
||||||
|
- [ ] Audio-Normalisierung (Lautstaerke zwischen Chunks angleichen)
|
||||||
|
- [ ] Piper Voices Download ueber Diagnostic (neue Sprachen/Stimmen)
|
||||||
|
|
||||||
### Architektur
|
### Architektur
|
||||||
- [ ] Bilder: Claude Vision direkt nutzen (aktuell nur Dateipfad an ARIA)
|
- [ ] Bilder: Claude Vision direkt nutzen (aktuell nur Dateipfad an ARIA)
|
||||||
- [ ] Auto-Compacting und Memory/Brain Verwaltung (SQLite?)
|
- [ ] Auto-Compacting und Memory/Brain Verwaltung (SQLite?)
|
||||||
- [ ] Diagnostic: System-Info Tab (Container-Status, Disk, RAM, CPU)
|
- [ ] Diagnostic: System-Info Tab (Container-Status, Disk, RAM, CPU)
|
||||||
|
- [ ] RVS Zombie-Connections endgueltig loesen (WebRTC statt WebSocket?)
|
||||||
|
|||||||
+36
-14
@@ -100,44 +100,66 @@ async function handleTTSRequest(payload) {
|
|||||||
// Markdown entfernen
|
// Markdown entfernen
|
||||||
const cleanText = text.replace(/\*\*([^*]+)\*\*/g, "$1").trim();
|
const cleanText = text.replace(/\*\*([^*]+)\*\*/g, "$1").trim();
|
||||||
|
|
||||||
// Text in Saetze aufteilen (sequentiell rendern fuer korrekte Reihenfolge)
|
// Text in Saetze aufteilen, dann zu Chunks von 2-3 Saetzen zusammenfassen
|
||||||
const sentences = cleanText.split(/(?<=[.!?])\s+/).map(s => s.trim()).filter(s => s.length > 0);
|
// (mehr Kontext = konsistentere Stimme/Lautstaerke, aber nicht zu lang fuer WebSocket)
|
||||||
if (sentences.length === 0) return;
|
const sentences = cleanText.split(/(?<=[.!?])\s+/)
|
||||||
|
.map(s => s.trim())
|
||||||
|
.filter(s => s.length > 0)
|
||||||
|
.map(s => s.replace(/[.]+$/, '')); // Punkt am Ende entfernen
|
||||||
|
|
||||||
log(`TTS-Request: "${cleanText.slice(0, 60)}..." (${sentences.length} Saetze, voice: ${voice || "default"}, lang: ${language || "de"})`);
|
const MAX_CHUNK_CHARS = 150; // Max ~150 Zeichen pro Chunk (schnelles Rendering, Preloading reicht)
|
||||||
|
const chunks = [];
|
||||||
|
let currentChunk = '';
|
||||||
|
for (const sentence of sentences) {
|
||||||
|
if (currentChunk && (currentChunk.length + sentence.length + 2) > MAX_CHUNK_CHARS) {
|
||||||
|
chunks.push(currentChunk);
|
||||||
|
currentChunk = sentence;
|
||||||
|
} else {
|
||||||
|
currentChunk = currentChunk ? currentChunk + ', ' + sentence : sentence;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
if (currentChunk) chunks.push(currentChunk);
|
||||||
|
if (chunks.length === 0) return;
|
||||||
|
|
||||||
|
log(`TTS-Request: "${cleanText.slice(0, 60)}..." (${sentences.length} Saetze → ${chunks.length} Chunks, voice: ${voice || "default"}, lang: ${language || "de"})`);
|
||||||
|
|
||||||
try {
|
try {
|
||||||
const voiceSample = voice ? path.join(VOICES_DIR, `${voice}.wav`) : null;
|
const voiceSample = voice ? path.join(VOICES_DIR, `${voice}.wav`) : null;
|
||||||
const hasCustomVoice = voiceSample && fs.existsSync(voiceSample);
|
const hasCustomVoice = voiceSample && fs.existsSync(voiceSample);
|
||||||
|
|
||||||
// Jeden Satz sequentiell rendern und sofort senden
|
// Streaming: Chunk rendern → sofort senden → naechster Chunk
|
||||||
for (let i = 0; i < sentences.length; i++) {
|
// App spielt mit Preloading-Queue nahtlos ab
|
||||||
const sentence = sentences[i];
|
let sentCount = 0;
|
||||||
|
|
||||||
|
for (let i = 0; i < chunks.length; i++) {
|
||||||
|
const chunk = chunks[i];
|
||||||
try {
|
try {
|
||||||
const audioBuffer = await callXTTSAPI(sentence, language || "de", hasCustomVoice ? voiceSample : null);
|
const audioBuffer = await callXTTSAPI(chunk, language || "de", hasCustomVoice ? voiceSample : null);
|
||||||
|
|
||||||
if (audioBuffer && audioBuffer.length > 100) {
|
if (audioBuffer && audioBuffer.length > 100) {
|
||||||
const base64 = audioBuffer.toString("base64");
|
log(`TTS [${i + 1}/${chunks.length}]: ${(audioBuffer.length / 1024).toFixed(0)}KB — "${chunk.slice(0, 50)}"`);
|
||||||
log(`TTS [${i + 1}/${sentences.length}]: ${audioBuffer.length} bytes (${(audioBuffer.length / 1024).toFixed(0)}KB) — "${sentence.slice(0, 40)}..."`);
|
|
||||||
|
|
||||||
sendToRVS({
|
sendToRVS({
|
||||||
type: "xtts_response",
|
type: "xtts_response",
|
||||||
payload: {
|
payload: {
|
||||||
requestId: `${requestId || ""}_${i}`,
|
requestId: `${requestId || ""}_${i}`,
|
||||||
base64,
|
base64: audioBuffer.toString("base64"),
|
||||||
mimeType: "audio/wav",
|
mimeType: "audio/wav",
|
||||||
voice: voice || "default",
|
voice: voice || "default",
|
||||||
engine: "xtts",
|
engine: "xtts",
|
||||||
|
part: i + 1,
|
||||||
|
totalParts: chunks.length,
|
||||||
},
|
},
|
||||||
timestamp: Date.now(),
|
timestamp: Date.now(),
|
||||||
});
|
});
|
||||||
|
sentCount++;
|
||||||
}
|
}
|
||||||
} catch (sentenceErr) {
|
} catch (chunkErr) {
|
||||||
log(`TTS [${i + 1}/${sentences.length}] Fehler: ${sentenceErr.message} — ueberspringe`);
|
log(`TTS [${i + 1}/${chunks.length}] Fehler: ${chunkErr.message} — ueberspringe`);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
log(`TTS komplett: ${sentences.length} Saetze gerendert`);
|
log(`TTS komplett: ${sentCount}/${chunks.length} Chunks gestreamt`);
|
||||||
} catch (err) {
|
} catch (err) {
|
||||||
log(`TTS Fehler: ${err.message}`);
|
log(`TTS Fehler: ${err.message}`);
|
||||||
sendToRVS({
|
sendToRVS({
|
||||||
|
|||||||
Reference in New Issue
Block a user