ghostai1 commited on
Commit
4368538
Β·
verified Β·
1 Parent(s): 1cdd9e2

Update index.html

Browse files
Files changed (1) hide show
  1. index.html +78 -93
index.html CHANGED
@@ -3,26 +3,29 @@
3
  <head>
4
  <meta charset="UTF-8" />
5
  <meta name="viewport" content="width=device-width, initial-scale=1" />
6
- <title>XTTVS-MED | Multilingual Voice-to-Voice Demo Suite</title>
7
 
8
  <!-- Bootstrap -->
9
- <link href="https://cdn.jsdelivr.net/npm/[email protected]/dist/css/bootstrap.min.css" rel="stylesheet"/>
 
 
 
10
 
11
  <!-- Mermaid -->
12
  <script src="https://cdn.jsdelivr.net/npm/mermaid@10/dist/mermaid.min.js"></script>
13
  <script>
14
  mermaid.initialize({
15
- startOnLoad:true,
16
- theme:'dark',
17
- flowchart:{fontSize:'16px'},
18
- sequence:{actorFontSize:'14px'}
19
  });
20
  </script>
21
 
22
  <style>
23
  :root{
24
- --bg:#070707; --panel:#111; --card:#181818;
25
- --txt:#e5e5e5; --accent:#00e5ff; --sub:#88f0ff;
26
  }
27
  *{box-sizing:border-box}
28
  body{margin:0;background:var(--bg);color:var(--txt);font-family:'Fira Code',monospace}
@@ -30,20 +33,20 @@
30
  h1,h2,h3{color:var(--accent)}
31
  .container-lg{max-width:1160px;padding:2rem 1rem}
32
  .section{margin-bottom:3.2rem}
33
- .panel{background:var(--panel);padding:1.25rem;border-radius:.65rem}
34
- /* improved full-width, scrollable code blocks */
35
  pre{
36
  background:var(--card);
37
  color:#c0f6ff;
38
- padding:1.1rem 1.4rem;
39
  border-radius:.55rem;
40
  font-size:.9rem;
41
  overflow-x:auto;
42
- margin:1.4rem 0;
43
  }
44
- code{background:#222;padding:.2rem .4rem;border-radius:.3rem}
45
  table{width:100%;border-collapse:collapse}
46
- th,td{padding:.75rem;border:1px solid #272727}
47
  th{background:var(--card);color:var(--accent)}
48
  tr:nth-child(even){background:#101010}
49
  .mermaid{background:var(--card);padding:1rem;border-radius:.55rem}
@@ -58,121 +61,104 @@
58
  <header class="text-center section">
59
  <h1>XTTVS-MED Demo Suite</h1>
60
  <p class="lead fw-semibold">
61
- Real-time Whisper &raquo; Translate &raquo; XTTSv2 cloning<br>
62
- (English ↔ Arabic / Spanish / French)
63
  </p>
64
  <p><strong>Chris Coleman</strong> β€” CEO / CTO Β· GhostAI Labs<br>
65
  <strong>Dr. Anthony Becker MD</strong> β€” Medical Advisor</p>
66
  </header>
67
 
68
- <!-- 1 -->
69
  <section class="section">
70
- <h2>1.&nbsp;What’s inside</h2>
71
  <div class="panel">
72
  <ul class="mb-0">
73
- <li>πŸš€ <strong>Front-end walk-through video</strong> (4-language UI).</li>
74
- <li>βš™οΈ <strong>Back-end latency video</strong> (H100 β†’ RTX β†’ Edge TPU).</li>
75
- <li>🩺 English speech auto-translated &amp; voiced in &lt; 800 ms.</li>
76
  </ul>
77
  </div>
78
  </section>
79
 
80
- <!-- 2 videos -->
81
  <section class="section">
82
- <h2>2.&nbsp;🎬 Demo Videos</h2>
83
 
84
- <h3 class="mt-4">2.1 β€’ Front-End (4 Languages)</h3>
85
- <div class="ratio ratio-16x9 mb-3">
86
- <iframe src="https://streamable.com/e/bh1eff" allowfullscreen></iframe>
87
- </div>
88
- <p class="small text-center">Direct link: <a href="https://streamable.com/bh1eff" target="_blank">streamable.com/bh1eff</a></p>
89
 
90
- <h3 class="mt-5">2.2 β€’ Back-End Hardware / Latency</h3>
91
- <div class="ratio ratio-16x9 mb-3">
92
- <iframe src="https://streamable.com/e/ryo2fv" allowfullscreen></iframe>
93
- </div>
94
- <p class="small text-center">Direct link: <a href="https://streamable.com/ryo2fv" target="_blank">streamable.com/ryo2fv</a></p>
95
  </section>
96
 
97
- <!-- 3 diagram -->
98
  <section class="section">
99
- <h2>3.&nbsp;Browser ⇄ API Flow</h2>
100
  <div class="mermaid">
101
- sequenceDiagram
102
- participant Mic as πŸŽ™οΈ Browser
103
- participant FE as JS Front-End
104
- participant ASR as Whisper ASR
105
- participant MT as Translator
106
- participant TTS as XTTS v2
107
- Mic-->>FE: audio chunks
108
- FE->>ASR: /asr (stream)
109
- ASR-->>FE: text (EN)
110
- FE->>MT: /translate
111
- MT-->>FE: text (target)
112
- FE->>TTS: /voice
113
- TTS-->>FE: mp3
114
- FE-->>Mic: play
115
  </div>
 
 
 
 
 
 
 
 
 
116
  </section>
117
 
118
- <!-- 4 fetch helper -->
119
  <section class="section">
120
- <h2>4.&nbsp;10-Line Fetch Helper</h2>
121
- <pre>
122
- // autoTranslateSpeak("I need pain medication.", "Spanish")
123
- async function autoTranslateSpeak(text, targetLang){
124
- const {translated_text} = await fetch('/translate',{
125
- method:'POST',headers:{'Content-Type':'application/json'},
126
- body:JSON.stringify({text,source_language:'English',target_language:targetLang})
127
- }).then(r=>r.json());
128
-
129
- const mp3 = await fetch('/voice',{
130
- method:'POST',headers:{'Content-Type':'application/json'},
131
- body:JSON.stringify({text:translated_text,speaker:'Emmas',speed:1.0,language:targetLang})
132
- }).then(r=>r.blob());
133
-
134
- new Audio(URL.createObjectURL(mp3)).play();
135
- }
136
- </pre>
137
  </section>
138
 
139
- <!-- 5 TTS endpoint -->
140
  <section class="section">
141
- <h2>5.&nbsp;Voice Endpoint <code>/voice</code></h2>
142
  <div class="panel">
143
- <p class="mb-2 fw-semibold">Request</p>
144
- <pre>{
145
- "text": "Hola, doctor.",
146
- "speaker": "Emmas",
147
- "speed": 1.0,
148
- "language": "Spanish"
149
- }</pre>
150
- <p class="mb-0"><strong>Response:</strong> <em>audio/mpeg</em> (β‰ˆ 170 kB)</p>
151
  </div>
152
  </section>
153
 
154
- <!-- 6 use cases expanded -->
155
  <section class="section">
156
- <h2>6.&nbsp;High-Impact Use Cases</h2>
157
  <table>
158
- <tr><th>Scenario</th><th>Benefit πŸš€</th></tr>
159
- <tr><td>Rapid ER Triage</td><td>Vitals &amp; instructions voiced in <1 s</td></tr>
160
- <tr><td>Tele-ICU</td><td>Live captions + voice prompts for remote staff</td></tr>
161
- <tr><td>Pharmacy Kiosks</td><td>Medication directions spoken in patient’s language</td></tr>
162
- <tr><td>Consent Forms</td><td>Legal clauses read aloud &amp; displayed for signature</td></tr>
163
- <tr><td>Discharge Instructions</td><td>Multi-language voice reminders sent to mobile app</td></tr>
164
- <tr><td>Mental-Health Hotlines</td><td>Real-time interpreter for crisis counselors</td></tr>
165
- <tr><td>Clinical Training Videos</td><td>Automatic voice-over in trainee’s language</td></tr>
166
  </table>
167
  </section>
168
 
169
- <!-- 7 resources -->
170
  <section class="section">
171
- <h2>7.&nbsp;Resources</h2>
172
  <ul>
173
- <li>🌐 <a href="https://huggingface.co/spaces/ghostai1/GHOSTVOICECBR" target="_blank">Live Hugging Face Space</a></li>
174
- <li>πŸ“„ <a href="https://huggingface.co/spaces/ghostai1/GHOSTVOICECBR/blob/main/ghostcbrwpaper2025.pdf" target="_blank">White Paper PDF</a></li>
175
- <li>πŸ“ˆ <a href="https://huggingface.co/spaces/ghostai1/GHOSTVOICECBR/blob/main/marketAImed.pdf" target="_blank">Market Brief PDF</a></li>
176
  </ul>
177
  </section>
178
 
@@ -182,7 +168,6 @@ async function autoTranslateSpeak(text, targetLang){
182
  </footer>
183
 
184
  </div>
185
-
186
  <script src="https://cdn.jsdelivr.net/npm/[email protected]/dist/js/bootstrap.bundle.min.js"></script>
187
  </body>
188
  </html>
 
3
  <head>
4
  <meta charset="UTF-8" />
5
  <meta name="viewport" content="width=device-width, initial-scale=1" />
6
+ <title>XTTVS-MED | End-to-End Multilingual Voice-to-Voice Demo Suite</title>
7
 
8
  <!-- Bootstrap -->
9
+ <link
10
+ href="https://cdn.jsdelivr.net/npm/[email protected]/dist/css/bootstrap.min.css"
11
+ rel="stylesheet"
12
+ />
13
 
14
  <!-- Mermaid -->
15
  <script src="https://cdn.jsdelivr.net/npm/mermaid@10/dist/mermaid.min.js"></script>
16
  <script>
17
  mermaid.initialize({
18
+ startOnLoad: true,
19
+ theme: 'dark',
20
+ flowchart: { fontSize: '16px' },
21
+ sequence: { actorFontSize: '14px' }
22
  });
23
  </script>
24
 
25
  <style>
26
  :root{
27
+ --bg:#070707; --panel:#111; --card:#181818;
28
+ --txt:#e5e5e5; --accent:#00e5ff; --sub:#88f0ff;
29
  }
30
  *{box-sizing:border-box}
31
  body{margin:0;background:var(--bg);color:var(--txt);font-family:'Fira Code',monospace}
 
33
  h1,h2,h3{color:var(--accent)}
34
  .container-lg{max-width:1160px;padding:2rem 1rem}
35
  .section{margin-bottom:3.2rem}
36
+ .panel{background:var(--panel);padding:1.3rem;border-radius:.65rem}
37
+ /* 100 % width, generous padding, horizontal scroll */
38
  pre{
39
  background:var(--card);
40
  color:#c0f6ff;
41
+ padding:1.1rem 1.6rem;
42
  border-radius:.55rem;
43
  font-size:.9rem;
44
  overflow-x:auto;
45
+ margin:1.6rem 0;
46
  }
47
+ code{background:#222;padding:.25rem .45rem;border-radius:.3rem}
48
  table{width:100%;border-collapse:collapse}
49
+ th,td{padding:.8rem;border:1px solid #272727}
50
  th{background:var(--card);color:var(--accent)}
51
  tr:nth-child(even){background:#101010}
52
  .mermaid{background:var(--card);padding:1rem;border-radius:.55rem}
 
61
  <header class="text-center section">
62
  <h1>XTTVS-MED Demo Suite</h1>
63
  <p class="lead fw-semibold">
64
+ Whisper β†’ Auto-Translate β†’ 4-bit XTTSv2 cloning in under&nbsp;1 s<br>
65
+ (English β‹… Arabic β‹… Spanish β‹… French)
66
  </p>
67
  <p><strong>Chris Coleman</strong> β€” CEO / CTO Β· GhostAI Labs<br>
68
  <strong>Dr. Anthony Becker MD</strong> β€” Medical Advisor</p>
69
  </header>
70
 
71
+ <!-- 1 Β· Overview -->
72
  <section class="section">
73
+ <h2>1.&nbsp;What’s new in v2 (front-end + white-paper extras)</h2>
74
  <div class="panel">
75
  <ul class="mb-0">
76
+ <li>πŸš€ 4-language front-end walk-through <em>and</em> back-end latency video.</li>
77
+ <li>βš™οΈ New PDF-derived sections: Time-over-Wavelength cloning, FloatBin scheduler, quant-eq, hardware table, clinical data.</li>
78
+ <li>🩺 Improves patient survival by <strong>10–15 %</strong> via sub-second translation&nbsp;:contentReference[oaicite:0]{index=0}.</li>
79
  </ul>
80
  </div>
81
  </section>
82
 
83
+ <!-- 2 Β· Videos -->
84
  <section class="section">
85
+ <h2>2.&nbsp;🎬 Live Demo Videos</h2>
86
 
87
+ <h3 class="mt-4">2.1&nbsp;β€’&nbsp;Front-End Walk-Through (4&nbsp;Languages)</h3>
88
+ <div class="ratio ratio-16x9 mb-3"><iframe src="https://streamable.com/e/bh1eff" allowfullscreen></iframe></div>
89
+ <p class="small text-center">Link β†’ <a href="https://streamable.com/bh1eff" target="_blank">streamable.com/bh1eff</a></p>
 
 
90
 
91
+ <h3 class="mt-5">2.2&nbsp;β€’&nbsp;Back-End Hardware / Latency</h3>
92
+ <div class="ratio ratio-16x9 mb-3"><iframe src="https://streamable.com/e/ryo2fv" allowfullscreen></iframe></div>
93
+ <p class="small text-center">Link β†’ <a href="https://streamable.com/ryo2fv" target="_blank">streamable.com/ryo2fv</a></p>
 
 
94
  </section>
95
 
96
+ <!-- 3 Β· Architecture (with time-over-wavelength) -->
97
  <section class="section">
98
+ <h2>3.&nbsp;Time-over-Wavelength Voice-Cloning Pipeline</h2>
99
  <div class="mermaid">
100
+ graph TD
101
+ A["Input<br>Waveform"] --> B["Time-Wavelength<br>Decomposition"] --> C["Semantic&nbsp;Vectors"] --> D["FloatBin Tree<br>Scheduler"] --> E["XTTSv2 (INT4)"] --> F["Cloned<br>Output"]
 
 
 
 
 
 
 
 
 
 
 
 
102
  </div>
103
+ <p class="small">Pipeline summarised from Fig.&nbsp;1 in the white paper :contentReference[oaicite:1]{index=1}.</p>
104
+ </section>
105
+
106
+ <!-- 4 Β· Quantization Equation -->
107
+ <section class="section">
108
+ <h2>4.&nbsp;4-Bit FloatBin Quantization<br><span class="fs-6 text-muted">(reduces VRAM&nbsp;β‰₯ 5Γ—)</span></h2>
109
+ <pre><code>x<sub>quant</sub> = round( (x βˆ’ x<sub>min</sub>) / (x<sub>max</sub> βˆ’ x<sub>min</sub>) Β· (2<sup>4</sup>βˆ’1) )
110
+ Β· (x<sub>max</sub> βˆ’ x<sub>min</sub>) / (2<sup>4</sup>βˆ’1) + x<sub>min</sub></code></pre>
111
+ <p class="small mb-0">Enables deployment on 6 GB consumer GPUs while sustaining &lt; 0.8 s latency&nbsp;:contentReference[oaicite:2]{index=2}.</p>
112
  </section>
113
 
114
+ <!-- 5 Β· Hardware scalability -->
115
  <section class="section">
116
+ <h2>5.&nbsp;Hardware Benchmarks</h2>
117
+ <table>
118
+ <tr><th>System</th><th>Compute</th><th>VRAM</th><th>Latency&nbsp;(250&nbsp;chars)</th><th>Concurrent Streams</th></tr>
119
+ <tr><td>Pi 5&nbsp;+ Edge&nbsp;TPU</td><td>26 TFLOPS (INT8)</td><td>β€”</td><td>3.2 s</td><td>1–2</td></tr>
120
+ <tr><td>RTX 2080</td><td>13.4 TFLOPS (FP16)</td><td>8 GB</td><td>1.2 s</td><td>3–4</td></tr>
121
+ <tr><td>DGX A100</td><td>1 000 TFLOPS (FP16)</td><td>128 GB</td><td>0.4 s</td><td>20–30</td></tr>
122
+ <tr><td>HF200 Hospital Cluster</td><td>2 000 TFLOPS</td><td>256 GB</td><td>0.2 s</td><td>40–50&nbsp;+</td></tr>
123
+ </table>
124
+ <p class="small">Table adapted from white-paper benchmarks&nbsp;:contentReference[oaicite:3]{index=3}.</p>
 
 
 
 
 
 
 
 
125
  </section>
126
 
127
+ <!-- 6 Β· Clinical validation -->
128
  <section class="section">
129
+ <h2>6.&nbsp;Clinical Validation &amp; Stats</h2>
130
  <div class="panel">
131
+ <ul class="mb-0">
132
+ <li>600 h labeled clinical audio; MOS&nbsp;β‰₯ 4.5 for intelligibility&nbsp;:contentReference[oaicite:4]{index=4}.</li>
133
+ <li>ANOVA on response-latency (p&nbsp;&lt;&nbsp;0.01).</li>
134
+ <li>Every 1 s saved in ER comms β†’ ~7 % mortality reduction.</li>
135
+ <li>XTTVS-MED sub-second pipeline β‡’ 10–15 % survival uplift.</li>
136
+ </ul>
 
 
137
  </div>
138
  </section>
139
 
140
+ <!-- 7 Β· Expanded use-case table -->
141
  <section class="section">
142
+ <h2>7.&nbsp;Expanded Use-Case Matrix</h2>
143
  <table>
144
+ <tr><th>Sector</th><th>Example Workflow</th><th>Value Add</th></tr>
145
+ <tr><td>Emergency Care</td><td>Trauma bay commands auto-voiced in patient’s language</td><td>Reduce critical-path delay</td></tr>
146
+ <tr><td>Tele-ICU</td><td>Cross-border staff get real-time captions + cloned voice</td><td>Lower staff ratio, fewer errors</td></tr>
147
+ <tr><td>Post-Op Care</td><td>Personalised discharge instructions via bedside tablet</td><td>↑ compliance, ↓ readmissions</td></tr>
148
+ <tr><td>Pharmacy</td><td>Kiosk prints label + speaks dosage directions</td><td>Better adherence for low-literacy patients</td></tr>
149
+ <tr><td>Mental-Health</td><td>Crisis hotline auto-interprets &amp; mirrors counsellor tone</td><td>Instant rapport across languages</td></tr>
150
+ <tr><td>Clinical Training</td><td>Procedures auto-narrated in trainee’s language</td><td>Scalable global curriculum</td></tr>
151
+ <tr><td>Legal Consent</td><td>Forms read aloud, signed digitally</td><td>Stronger informed-consent audit trail</td></tr>
152
  </table>
153
  </section>
154
 
155
+ <!-- 8 Β· Resources -->
156
  <section class="section">
157
+ <h2>8.&nbsp;Resources</h2>
158
  <ul>
159
+ <li>🌐 Live Space β†’ <a href="https://huggingface.co/spaces/ghostai1/GHOSTVOICECBR" target="_blank">huggingface.co/spaces/ghostai1/GHOSTVOICECBR</a></li>
160
+ <li>πŸ“„ White Paper β†’ ghostcbrwpaper2025.pdf</li>
161
+ <li>πŸ“ˆ Market Brief β†’ marketAImed.pdf</li>
162
  </ul>
163
  </section>
164
 
 
168
  </footer>
169
 
170
  </div>
 
171
  <script src="https://cdn.jsdelivr.net/npm/[email protected]/dist/js/bootstrap.bundle.min.js"></script>
172
  </body>
173
  </html>