Spaces:
Running
Running
Update index.html
Browse files- index.html +78 -93
index.html
CHANGED
@@ -3,26 +3,29 @@
|
|
3 |
<head>
|
4 |
<meta charset="UTF-8" />
|
5 |
<meta name="viewport" content="width=device-width, initial-scale=1" />
|
6 |
-
<title>XTTVS-MED | Multilingual Voice-to-Voice Demo Suite</title>
|
7 |
|
8 |
<!-- Bootstrap -->
|
9 |
-
<link
|
|
|
|
|
|
|
10 |
|
11 |
<!-- Mermaid -->
|
12 |
<script src="https://cdn.jsdelivr.net/npm/mermaid@10/dist/mermaid.min.js"></script>
|
13 |
<script>
|
14 |
mermaid.initialize({
|
15 |
-
startOnLoad:true,
|
16 |
-
theme:'dark',
|
17 |
-
flowchart:{fontSize:'16px'},
|
18 |
-
sequence:{actorFontSize:'14px'}
|
19 |
});
|
20 |
</script>
|
21 |
|
22 |
<style>
|
23 |
:root{
|
24 |
-
--bg:#070707;
|
25 |
-
--txt:#e5e5e5;
|
26 |
}
|
27 |
*{box-sizing:border-box}
|
28 |
body{margin:0;background:var(--bg);color:var(--txt);font-family:'Fira Code',monospace}
|
@@ -30,20 +33,20 @@
|
|
30 |
h1,h2,h3{color:var(--accent)}
|
31 |
.container-lg{max-width:1160px;padding:2rem 1rem}
|
32 |
.section{margin-bottom:3.2rem}
|
33 |
-
.panel{background:var(--panel);padding:1.
|
34 |
-
/*
|
35 |
pre{
|
36 |
background:var(--card);
|
37 |
color:#c0f6ff;
|
38 |
-
padding:1.1rem 1.
|
39 |
border-radius:.55rem;
|
40 |
font-size:.9rem;
|
41 |
overflow-x:auto;
|
42 |
-
margin:1.
|
43 |
}
|
44 |
-
code{background:#222;padding:.
|
45 |
table{width:100%;border-collapse:collapse}
|
46 |
-
th,td{padding:.
|
47 |
th{background:var(--card);color:var(--accent)}
|
48 |
tr:nth-child(even){background:#101010}
|
49 |
.mermaid{background:var(--card);padding:1rem;border-radius:.55rem}
|
@@ -58,121 +61,104 @@
|
|
58 |
<header class="text-center section">
|
59 |
<h1>XTTVS-MED Demo Suite</h1>
|
60 |
<p class="lead fw-semibold">
|
61 |
-
|
62 |
-
|
63 |
</p>
|
64 |
<p><strong>Chris Coleman</strong> β CEO / CTO Β· GhostAI Labs<br>
|
65 |
<strong>Dr. Anthony Becker MD</strong> β Medical Advisor</p>
|
66 |
</header>
|
67 |
|
68 |
-
<!-- 1 -->
|
69 |
<section class="section">
|
70 |
-
<h2>1. Whatβs
|
71 |
<div class="panel">
|
72 |
<ul class="mb-0">
|
73 |
-
<li>π
|
74 |
-
<li>βοΈ
|
75 |
-
<li>π©Ί
|
76 |
</ul>
|
77 |
</div>
|
78 |
</section>
|
79 |
|
80 |
-
<!-- 2
|
81 |
<section class="section">
|
82 |
-
<h2>2. π¬ Demo Videos</h2>
|
83 |
|
84 |
-
<h3 class="mt-4">2.1
|
85 |
-
<div class="ratio ratio-16x9 mb-3">
|
86 |
-
|
87 |
-
</div>
|
88 |
-
<p class="small text-center">Direct link: <a href="https://streamable.com/bh1eff" target="_blank">streamable.com/bh1eff</a></p>
|
89 |
|
90 |
-
<h3 class="mt-5">2.2
|
91 |
-
<div class="ratio ratio-16x9 mb-3">
|
92 |
-
|
93 |
-
</div>
|
94 |
-
<p class="small text-center">Direct link: <a href="https://streamable.com/ryo2fv" target="_blank">streamable.com/ryo2fv</a></p>
|
95 |
</section>
|
96 |
|
97 |
-
<!-- 3
|
98 |
<section class="section">
|
99 |
-
<h2>3.
|
100 |
<div class="mermaid">
|
101 |
-
|
102 |
-
|
103 |
-
participant FE as JS Front-End
|
104 |
-
participant ASR as Whisper ASR
|
105 |
-
participant MT as Translator
|
106 |
-
participant TTS as XTTS v2
|
107 |
-
Mic-->>FE: audio chunks
|
108 |
-
FE->>ASR: /asr (stream)
|
109 |
-
ASR-->>FE: text (EN)
|
110 |
-
FE->>MT: /translate
|
111 |
-
MT-->>FE: text (target)
|
112 |
-
FE->>TTS: /voice
|
113 |
-
TTS-->>FE: mp3
|
114 |
-
FE-->>Mic: play
|
115 |
</div>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
116 |
</section>
|
117 |
|
118 |
-
<!--
|
119 |
<section class="section">
|
120 |
-
<h2>
|
121 |
-
<
|
122 |
-
|
123 |
-
|
124 |
-
|
125 |
-
|
126 |
-
|
127 |
-
|
128 |
-
|
129 |
-
const mp3 = await fetch('/voice',{
|
130 |
-
method:'POST',headers:{'Content-Type':'application/json'},
|
131 |
-
body:JSON.stringify({text:translated_text,speaker:'Emmas',speed:1.0,language:targetLang})
|
132 |
-
}).then(r=>r.blob());
|
133 |
-
|
134 |
-
new Audio(URL.createObjectURL(mp3)).play();
|
135 |
-
}
|
136 |
-
</pre>
|
137 |
</section>
|
138 |
|
139 |
-
<!--
|
140 |
<section class="section">
|
141 |
-
<h2>
|
142 |
<div class="panel">
|
143 |
-
<
|
144 |
-
<
|
145 |
-
|
146 |
-
|
147 |
-
|
148 |
-
|
149 |
-
}</pre>
|
150 |
-
<p class="mb-0"><strong>Response:</strong> <em>audio/mpeg</em> (β 170 kB)</p>
|
151 |
</div>
|
152 |
</section>
|
153 |
|
154 |
-
<!--
|
155 |
<section class="section">
|
156 |
-
<h2>
|
157 |
<table>
|
158 |
-
<tr><th>
|
159 |
-
<tr><td>
|
160 |
-
<tr><td>Tele-ICU</td><td>
|
161 |
-
<tr><td>
|
162 |
-
<tr><td>
|
163 |
-
<tr><td>
|
164 |
-
<tr><td>
|
165 |
-
<tr><td>
|
166 |
</table>
|
167 |
</section>
|
168 |
|
169 |
-
<!--
|
170 |
<section class="section">
|
171 |
-
<h2>
|
172 |
<ul>
|
173 |
-
<li>π <a href="https://huggingface.co/spaces/ghostai1/GHOSTVOICECBR" target="_blank">
|
174 |
-
<li>π
|
175 |
-
<li>π
|
176 |
</ul>
|
177 |
</section>
|
178 |
|
@@ -182,7 +168,6 @@ async function autoTranslateSpeak(text, targetLang){
|
|
182 |
</footer>
|
183 |
|
184 |
</div>
|
185 |
-
|
186 |
<script src="https://cdn.jsdelivr.net/npm/[email protected]/dist/js/bootstrap.bundle.min.js"></script>
|
187 |
</body>
|
188 |
</html>
|
|
|
3 |
<head>
|
4 |
<meta charset="UTF-8" />
|
5 |
<meta name="viewport" content="width=device-width, initial-scale=1" />
|
6 |
+
<title>XTTVS-MED | End-to-End Multilingual Voice-to-Voice Demo Suite</title>
|
7 |
|
8 |
<!-- Bootstrap -->
|
9 |
+
<link
|
10 |
+
href="https://cdn.jsdelivr.net/npm/[email protected]/dist/css/bootstrap.min.css"
|
11 |
+
rel="stylesheet"
|
12 |
+
/>
|
13 |
|
14 |
<!-- Mermaid -->
|
15 |
<script src="https://cdn.jsdelivr.net/npm/mermaid@10/dist/mermaid.min.js"></script>
|
16 |
<script>
|
17 |
mermaid.initialize({
|
18 |
+
startOnLoad: true,
|
19 |
+
theme: 'dark',
|
20 |
+
flowchart: { fontSize: '16px' },
|
21 |
+
sequence: { actorFontSize: '14px' }
|
22 |
});
|
23 |
</script>
|
24 |
|
25 |
<style>
|
26 |
:root{
|
27 |
+
--bg:#070707; --panel:#111; --card:#181818;
|
28 |
+
--txt:#e5e5e5; --accent:#00e5ff; --sub:#88f0ff;
|
29 |
}
|
30 |
*{box-sizing:border-box}
|
31 |
body{margin:0;background:var(--bg);color:var(--txt);font-family:'Fira Code',monospace}
|
|
|
33 |
h1,h2,h3{color:var(--accent)}
|
34 |
.container-lg{max-width:1160px;padding:2rem 1rem}
|
35 |
.section{margin-bottom:3.2rem}
|
36 |
+
.panel{background:var(--panel);padding:1.3rem;border-radius:.65rem}
|
37 |
+
/* 100 % width, generous padding, horizontal scroll */
|
38 |
pre{
|
39 |
background:var(--card);
|
40 |
color:#c0f6ff;
|
41 |
+
padding:1.1rem 1.6rem;
|
42 |
border-radius:.55rem;
|
43 |
font-size:.9rem;
|
44 |
overflow-x:auto;
|
45 |
+
margin:1.6rem 0;
|
46 |
}
|
47 |
+
code{background:#222;padding:.25rem .45rem;border-radius:.3rem}
|
48 |
table{width:100%;border-collapse:collapse}
|
49 |
+
th,td{padding:.8rem;border:1px solid #272727}
|
50 |
th{background:var(--card);color:var(--accent)}
|
51 |
tr:nth-child(even){background:#101010}
|
52 |
.mermaid{background:var(--card);padding:1rem;border-radius:.55rem}
|
|
|
61 |
<header class="text-center section">
|
62 |
<h1>XTTVS-MED Demo Suite</h1>
|
63 |
<p class="lead fw-semibold">
|
64 |
+
Whisper β Auto-Translate β 4-bit XTTSv2 cloning in under 1 s<br>
|
65 |
+
(English β
Arabic β
Spanish β
French)
|
66 |
</p>
|
67 |
<p><strong>Chris Coleman</strong> β CEO / CTO Β· GhostAI Labs<br>
|
68 |
<strong>Dr. Anthony Becker MD</strong> β Medical Advisor</p>
|
69 |
</header>
|
70 |
|
71 |
+
<!-- 1 Β· Overview -->
|
72 |
<section class="section">
|
73 |
+
<h2>1. Whatβs new in v2 (front-end + white-paper extras)</h2>
|
74 |
<div class="panel">
|
75 |
<ul class="mb-0">
|
76 |
+
<li>π 4-language front-end walk-through <em>and</em> back-end latency video.</li>
|
77 |
+
<li>βοΈ New PDF-derived sections: Time-over-Wavelength cloning, FloatBin scheduler, quant-eq, hardware table, clinical data.</li>
|
78 |
+
<li>π©Ί Improves patient survival by <strong>10β15 %</strong> via sub-second translation :contentReference[oaicite:0]{index=0}.</li>
|
79 |
</ul>
|
80 |
</div>
|
81 |
</section>
|
82 |
|
83 |
+
<!-- 2 Β· Videos -->
|
84 |
<section class="section">
|
85 |
+
<h2>2. π¬ Live Demo Videos</h2>
|
86 |
|
87 |
+
<h3 class="mt-4">2.1 β’ Front-End Walk-Through (4 Languages)</h3>
|
88 |
+
<div class="ratio ratio-16x9 mb-3"><iframe src="https://streamable.com/e/bh1eff" allowfullscreen></iframe></div>
|
89 |
+
<p class="small text-center">Link β <a href="https://streamable.com/bh1eff" target="_blank">streamable.com/bh1eff</a></p>
|
|
|
|
|
90 |
|
91 |
+
<h3 class="mt-5">2.2 β’ Back-End Hardware / Latency</h3>
|
92 |
+
<div class="ratio ratio-16x9 mb-3"><iframe src="https://streamable.com/e/ryo2fv" allowfullscreen></iframe></div>
|
93 |
+
<p class="small text-center">Link β <a href="https://streamable.com/ryo2fv" target="_blank">streamable.com/ryo2fv</a></p>
|
|
|
|
|
94 |
</section>
|
95 |
|
96 |
+
<!-- 3 Β· Architecture (with time-over-wavelength) -->
|
97 |
<section class="section">
|
98 |
+
<h2>3. Time-over-Wavelength Voice-Cloning Pipeline</h2>
|
99 |
<div class="mermaid">
|
100 |
+
graph TD
|
101 |
+
A["Input<br>Waveform"] --> B["Time-Wavelength<br>Decomposition"] --> C["Semantic Vectors"] --> D["FloatBin Tree<br>Scheduler"] --> E["XTTSv2 (INT4)"] --> F["Cloned<br>Output"]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
102 |
</div>
|
103 |
+
<p class="small">Pipeline summarised from Fig. 1 in the white paper :contentReference[oaicite:1]{index=1}.</p>
|
104 |
+
</section>
|
105 |
+
|
106 |
+
<!-- 4 Β· Quantization Equation -->
|
107 |
+
<section class="section">
|
108 |
+
<h2>4. 4-Bit FloatBin Quantization<br><span class="fs-6 text-muted">(reduces VRAM β₯ 5Γ)</span></h2>
|
109 |
+
<pre><code>x<sub>quant</sub> = round( (x β x<sub>min</sub>) / (x<sub>max</sub> β x<sub>min</sub>) Β· (2<sup>4</sup>β1) )
|
110 |
+
Β· (x<sub>max</sub> β x<sub>min</sub>) / (2<sup>4</sup>β1) + x<sub>min</sub></code></pre>
|
111 |
+
<p class="small mb-0">Enables deployment on 6 GB consumer GPUs while sustaining < 0.8 s latency :contentReference[oaicite:2]{index=2}.</p>
|
112 |
</section>
|
113 |
|
114 |
+
<!-- 5 Β· Hardware scalability -->
|
115 |
<section class="section">
|
116 |
+
<h2>5. Hardware Benchmarks</h2>
|
117 |
+
<table>
|
118 |
+
<tr><th>System</th><th>Compute</th><th>VRAM</th><th>Latency (250 chars)</th><th>Concurrent Streams</th></tr>
|
119 |
+
<tr><td>Pi 5 + Edge TPU</td><td>26 TFLOPS (INT8)</td><td>β</td><td>3.2 s</td><td>1β2</td></tr>
|
120 |
+
<tr><td>RTX 2080</td><td>13.4 TFLOPS (FP16)</td><td>8 GB</td><td>1.2 s</td><td>3β4</td></tr>
|
121 |
+
<tr><td>DGX A100</td><td>1 000 TFLOPS (FP16)</td><td>128 GB</td><td>0.4 s</td><td>20β30</td></tr>
|
122 |
+
<tr><td>HF200 Hospital Cluster</td><td>2 000 TFLOPS</td><td>256 GB</td><td>0.2 s</td><td>40β50 +</td></tr>
|
123 |
+
</table>
|
124 |
+
<p class="small">Table adapted from white-paper benchmarks :contentReference[oaicite:3]{index=3}.</p>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
125 |
</section>
|
126 |
|
127 |
+
<!-- 6 Β· Clinical validation -->
|
128 |
<section class="section">
|
129 |
+
<h2>6. Clinical Validation & Stats</h2>
|
130 |
<div class="panel">
|
131 |
+
<ul class="mb-0">
|
132 |
+
<li>600 h labeled clinical audio; MOS β₯ 4.5 for intelligibility :contentReference[oaicite:4]{index=4}.</li>
|
133 |
+
<li>ANOVA on response-latency (p < 0.01).</li>
|
134 |
+
<li>Every 1 s saved in ER comms β ~7 % mortality reduction.</li>
|
135 |
+
<li>XTTVS-MED sub-second pipeline β 10β15 % survival uplift.</li>
|
136 |
+
</ul>
|
|
|
|
|
137 |
</div>
|
138 |
</section>
|
139 |
|
140 |
+
<!-- 7 Β· Expanded use-case table -->
|
141 |
<section class="section">
|
142 |
+
<h2>7. Expanded Use-Case Matrix</h2>
|
143 |
<table>
|
144 |
+
<tr><th>Sector</th><th>Example Workflow</th><th>Value Add</th></tr>
|
145 |
+
<tr><td>Emergency Care</td><td>Trauma bay commands auto-voiced in patientβs language</td><td>Reduce critical-path delay</td></tr>
|
146 |
+
<tr><td>Tele-ICU</td><td>Cross-border staff get real-time captions + cloned voice</td><td>Lower staff ratio, fewer errors</td></tr>
|
147 |
+
<tr><td>Post-Op Care</td><td>Personalised discharge instructions via bedside tablet</td><td>β compliance, β readmissions</td></tr>
|
148 |
+
<tr><td>Pharmacy</td><td>Kiosk prints label + speaks dosage directions</td><td>Better adherence for low-literacy patients</td></tr>
|
149 |
+
<tr><td>Mental-Health</td><td>Crisis hotline auto-interprets & mirrors counsellor tone</td><td>Instant rapport across languages</td></tr>
|
150 |
+
<tr><td>Clinical Training</td><td>Procedures auto-narrated in traineeβs language</td><td>Scalable global curriculum</td></tr>
|
151 |
+
<tr><td>Legal Consent</td><td>Forms read aloud, signed digitally</td><td>Stronger informed-consent audit trail</td></tr>
|
152 |
</table>
|
153 |
</section>
|
154 |
|
155 |
+
<!-- 8 Β· Resources -->
|
156 |
<section class="section">
|
157 |
+
<h2>8. Resources</h2>
|
158 |
<ul>
|
159 |
+
<li>π Live Space β <a href="https://huggingface.co/spaces/ghostai1/GHOSTVOICECBR" target="_blank">huggingface.co/spaces/ghostai1/GHOSTVOICECBR</a></li>
|
160 |
+
<li>π White Paper β ghostcbrwpaper2025.pdf</li>
|
161 |
+
<li>π Market Brief β marketAImed.pdf</li>
|
162 |
</ul>
|
163 |
</section>
|
164 |
|
|
|
168 |
</footer>
|
169 |
|
170 |
</div>
|
|
|
171 |
<script src="https://cdn.jsdelivr.net/npm/[email protected]/dist/js/bootstrap.bundle.min.js"></script>
|
172 |
</body>
|
173 |
</html>
|