This commit adds a real-time interpreter mode to the Voice Language Translator:
- Implements continuous speech-to-translation capabilities using WebSockets
- Adds background processing threads for audio, transcription, and TTS
- Adds client-side speech detection and streaming
- Updates UI to include real-time interpreter controls
- Adds necessary dependencies (flask-socketio, eventlet)
243 lines
11 KiB
HTML
243 lines
11 KiB
HTML
<!DOCTYPE html>
|
|
<html lang="en">
|
|
<head>
|
|
<!-- Encoding, viewport and title. Zoom is intentionally NOT disabled
     (no user-scalable=no / maximum-scale) so low-vision users can
     pinch-zoom the page. -->
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<title>Voice Language Translator</title>

<!-- Third-party styles: Bootstrap and Font Awesome from public CDNs. -->
<link href="https://cdn.jsdelivr.net/npm/bootstrap@5.3.0-alpha1/dist/css/bootstrap.min.css" rel="stylesheet">
<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.0.0/css/all.min.css">

<!-- Favicon plus iOS home-screen icons (default first, then size-specific). -->
<link rel="icon" href="/favicon.ico" sizes="any">
<link rel="apple-touch-icon" href="/static/icons/apple-icon-180x180.png">
<link rel="apple-touch-icon" sizes="152x152" href="/static/icons/apple-icon-152x152.png">
<link rel="apple-touch-icon" sizes="180x180" href="/static/icons/apple-icon-180x180.png">
<link rel="apple-touch-icon" sizes="167x167" href="/static/icons/apple-icon-167x167.png">

<!-- Socket.IO client library. Loaded without defer/async, so it has
     finished executing before any script further down the document runs. -->
<script src="https://cdn.socket.io/4.6.0/socket.io.min.js"></script>
|
|
<style>
  /* Page-level spacing and background. */
  body {
    padding-top: 20px;
    padding-bottom: 20px;
    background-color: #f8f9fa;
  }

  /* Round microphone button: fixed 80x80 box, icon centred with flexbox. */
  .record-btn {
    width: 80px;
    height: 80px;
    border-radius: 50%; /* This makes the button circular */
    display: flex;
    align-items: center;
    justify-content: center;
    font-size: 32px;
    margin: 20px auto;
    box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1);
    transition: all 0.3s;
    padding: 0; /* Remove padding to ensure perfect circle */
    border: none; /* Remove border for cleaner look */
  }

  /* Pressed feedback: shrink slightly and flatten the shadow. */
  .record-btn:active {
    transform: scale(0.95);
    box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);
  }

  /* Applied while recording: red fill and a continuous pulse. */
  .recording {
    background-color: #dc3545 !important;
    animation: pulse 1.5s infinite;
  }

  /* Higher-specificity override so the .btn radius cannot square the circle. */
  .record-btn.btn {
    border-radius: 50% !important;
    line-height: 1;
  }

  /* Gentle grow-and-return used by .recording. */
  @keyframes pulse {
    0%,
    100% {
      transform: scale(1);
    }

    50% {
      transform: scale(1.05);
    }
  }

  /* Card chrome: rounded corners and a soft shadow. */
  .card {
    border-radius: 15px;
    box-shadow: 0 4px 6px rgba(0, 0, 0, 0.1);
    margin-bottom: 20px;
  }

  /* Header corners match the card's top radius. */
  .card-header {
    border-radius: 15px 15px 0 0 !important;
  }

  .language-select {
    border-radius: 10px;
    padding: 10px;
  }

  /* Transcript / translation panes: at least 100px tall, scroll past 300px. */
  .text-display {
    min-height: 100px;
    padding: 15px;
    background-color: #f8f9fa;
    border-radius: 10px;
    margin-bottom: 15px;
    overflow-y: auto;
    max-height: 300px;
  }

  .btn-action {
    border-radius: 10px;
    padding: 8px 15px;
    margin: 5px;
  }

  /* Small inline spinner sized to sit next to button text. */
  .spinner-border {
    width: 1rem;
    height: 1rem;
    margin-right: 5px;
  }

  .status-indicator {
    font-size: 0.9rem;
    font-style: italic;
    color: #6c757d;
  }

  /* Respect the OS "reduce motion" setting: drop the button transition and
     the infinite recording pulse. The red fill from .recording still
     signals the recording state. */
  @media (prefers-reduced-motion: reduce) {
    .record-btn {
      transition: none;
    }

    .recording {
      animation: none;
    }
  }
</style>
|
|
|
|
<!-- PWA meta tags: description, browser UI colour, and standalone
     (home-screen) behaviour. -->
<meta name="description" content="Translate spoken language between multiple languages with speech input and output">
<meta name="theme-color" content="#007bff">
<!-- Standard name first; the apple-prefixed variant is kept for iOS Safari. -->
<meta name="mobile-web-app-capable" content="yes">
<meta name="apple-mobile-web-app-capable" content="yes">
<meta name="apple-mobile-web-app-status-bar-style" content="black-translucent">
<meta name="apple-mobile-web-app-title" content="Translator">

<!-- PWA manifest and PNG icon. The default 180x180 apple-touch-icon is
     declared once, with the other touch icons earlier in the head, so it
     is not repeated here. -->
<link rel="manifest" href="/static/manifest.json">
<link rel="icon" type="image/png" href="/static/icons/icon-192x192.png">
|
|
|
|
<!-- iOS launch (splash) images. Each entry is matched by its media query:
     portrait orientation plus the stated device width, height and
     pixel ratio. -->
<link
  rel="apple-touch-startup-image"
  href="/static/splash/apple-splash-2048-2732.png"
  media="(device-width: 1024px) and (device-height: 1366px) and (-webkit-device-pixel-ratio: 2) and (orientation: portrait)">
<link
  rel="apple-touch-startup-image"
  href="/static/splash/apple-splash-1668-2388.png"
  media="(device-width: 834px) and (device-height: 1194px) and (-webkit-device-pixel-ratio: 2) and (orientation: portrait)">
<link
  rel="apple-touch-startup-image"
  href="/static/splash/apple-splash-1536-2048.png"
  media="(device-width: 768px) and (device-height: 1024px) and (-webkit-device-pixel-ratio: 2) and (orientation: portrait)">
<link
  rel="apple-touch-startup-image"
  href="/static/splash/apple-splash-1125-2436.png"
  media="(device-width: 375px) and (device-height: 812px) and (-webkit-device-pixel-ratio: 3) and (orientation: portrait)">
<link
  rel="apple-touch-startup-image"
  href="/static/splash/apple-splash-1242-2688.png"
  media="(device-width: 414px) and (device-height: 896px) and (-webkit-device-pixel-ratio: 3) and (orientation: portrait)">
<link
  rel="apple-touch-startup-image"
  href="/static/splash/apple-splash-750-1334.png"
  media="(device-width: 375px) and (device-height: 667px) and (-webkit-device-pixel-ratio: 2) and (orientation: portrait)">
<link
  rel="apple-touch-startup-image"
  href="/static/splash/apple-splash-640-1136.png"
  media="(device-width: 320px) and (device-height: 568px) and (-webkit-device-pixel-ratio: 2) and (orientation: portrait)">
|
|
|
|
<!-- Project stylesheet. Bootstrap and Font Awesome are already linked near
     the top of the head; linking them a second time here re-applied
     Bootstrap after the inline <style> block, which lets Bootstrap win over
     the page's own rules of equal specificity and costs extra requests. -->
<link rel="stylesheet" href="/static/css/styles.css">
|
|
|
|
</head>
|
|
<body>
|
|
<div class="container">
|
|
<!-- Page heading: the only h1 in this template's visible markup. -->
<h1 class="text-center mb-4">Voice Language Translator</h1>
|
|
<!--<p class="text-center text-muted">Powered by Gemma 3, Whisper & Edge TTS</p>-->
|
|
|
|
<div class="row">
|
|
<!-- Source column: language picker, transcript pane, and play/clear buttons. -->
<div class="col-md-6 mb-3">
  <div class="card">
    <div class="card-header bg-primary text-white">
      <h5 class="mb-0">Source</h5>
    </div>
    <div class="card-body">
      <!-- There is no visible <label>, so aria-label gives the control its
           accessible name. Options come from the template's `languages`. -->
      <select id="sourceLanguage" class="form-select language-select mb-3" aria-label="Source language">
        {% for language in languages %}
        <option value="{{ language }}">{{ language }}</option>
        {% endfor %}
      </select>
      <div class="text-display" id="sourceText">
        <p class="text-muted">Your transcribed text will appear here...</p>
      </div>
      <div class="d-flex justify-content-between">
        <!-- Starts disabled in the markup. Icons are decorative, so they are
             hidden from assistive tech; the text is the button's name. -->
        <button type="button" id="playSource" class="btn btn-outline-primary btn-action" disabled>
          <i class="fas fa-play" aria-hidden="true"></i> Play
        </button>
        <button type="button" id="clearSource" class="btn btn-outline-secondary btn-action">
          <i class="fas fa-trash" aria-hidden="true"></i> Clear
        </button>
      </div>
    </div>
  </div>
</div>
|
|
|
|
<!-- Translation column: target-language picker, translated-text pane, and
     play/clear buttons. -->
<div class="col-md-6 mb-3">
  <div class="card">
    <div class="card-header bg-success text-white">
      <h5 class="mb-0">Translation</h5>
    </div>
    <div class="card-body">
      <!-- There is no visible <label>, so aria-label gives the control its
           accessible name. Options come from the template's `languages`. -->
      <select id="targetLanguage" class="form-select language-select mb-3" aria-label="Target language">
        {% for language in languages %}
        <option value="{{ language }}">{{ language }}</option>
        {% endfor %}
      </select>
      <div class="text-display" id="translatedText">
        <p class="text-muted">Translation will appear here...</p>
      </div>
      <div class="d-flex justify-content-between">
        <!-- Starts disabled in the markup. Icons are decorative, so they are
             hidden from assistive tech; the text is the button's name. -->
        <button type="button" id="playTranslation" class="btn btn-outline-success btn-action" disabled>
          <i class="fas fa-play" aria-hidden="true"></i> Play
        </button>
        <button type="button" id="clearTranslation" class="btn btn-outline-secondary btn-action">
          <i class="fas fa-trash" aria-hidden="true"></i> Clear
        </button>
      </div>
    </div>
  </div>
</div>
|
|
</div>
|
|
|
|
<!-- Record control: round microphone button with a status line beneath it. -->
<div class="text-center">
  <!-- Icon-only button, so aria-label supplies its accessible name. The
       label is state-neutral because nothing in this markup updates it
       when recording starts or stops. -->
  <button type="button" id="recordBtn" class="btn btn-primary record-btn" aria-label="Toggle recording">
    <i class="fas fa-microphone" aria-hidden="true"></i>
  </button>
  <!-- role="status" makes this a polite live region, so text changes are
       announced by screen readers. -->
  <p class="status-indicator" id="statusIndicator" role="status">Click to start recording</p>
</div>
|
|
|
|
<!-- Manual translate action; the button starts disabled in the markup. -->
<div class="text-center mt-3">
  <button type="button" id="translateBtn" class="btn btn-success" disabled>
    <i class="fas fa-language" aria-hidden="true"></i> Translate
  </button>
</div>

<!-- Real-time interpreter toggle with its own status line. -->
<div class="text-center mt-3">
  <button type="button" id="realtimeBtn" class="btn btn-primary">
    <i class="fas fa-language" aria-hidden="true"></i> Start Interpreter
  </button>
  <!-- role="status" makes this a polite live region, so text changes are
       announced by screen readers. -->
  <p class="status-indicator" id="realtimeStatusIndicator" role="status">Interpreter ready</p>
</div>
|
|
|
|
<!-- Progress bar; the container carries d-none, so it starts hidden. -->
<div class="mt-3">
  <div class="progress d-none" id="progressContainer">
    <!-- role="progressbar" requires an accessible name, supplied here via
         aria-label together with the 0-100 range. aria-valuenow is left
         out on purpose: nothing in this markup keeps it in sync with the
         inline width, and a stale value would mislead assistive tech. -->
    <div id="progressBar" class="progress-bar progress-bar-striped progress-bar-animated" role="progressbar" aria-label="Processing progress" aria-valuemin="0" aria-valuemax="100" style="width: 0%"></div>
  </div>
</div>
|
|
|
|
<!-- Add explanation of real-time interpreter mode -->
|
|
<!-- Full-width help card describing the real-time interpretation mode. -->
<div class="row mt-4">
  <div class="col-md-12">
    <div class="card">
      <div class="card-header bg-info text-white">
        <h5 class="mb-0">Real-time Interpretation Mode</h5>
      </div>
      <div class="card-body">
        <p>This mode enables continuous, real-time interpretation as you speak:</p>
        <!-- One entry per interpreter button label. -->
        <ul>
          <li><strong>Start Interpreter</strong> - Begin continuous speech interpretation</li>
          <li><strong>Stop Interpreter</strong> - End the real-time interpretation session</li>
        </ul>
        <p class="text-muted">
          <small>
            The interpreter will automatically detect speech, transcribe, translate, and speak the translation with minimal delay.
            Pause detection automatically handles natural breaks in conversation.
          </small>
        </p>
      </div>
    </div>
  </div>
</div>
|
|
|
|
<!-- Audio element with no src and no controls, kept out of the layout by
     the inline display:none.
     NOTE(review): presumably driven from /static/js/app.js - confirm. -->
<audio id="audioPlayer" style="display: none;"></audio>
|
|
</div>
|
|
|
|
<!-- Bootstrap JS bundle, same 5.3.0-alpha1 version as the Bootstrap CSS
     linked in the head. -->
<script src="https://cdn.jsdelivr.net/npm/bootstrap@5.3.0-alpha1/dist/js/bootstrap.bundle.min.js"></script>
|
|
<!-- Application script, placed last in the body so the markup above is
     already parsed when it runs.
     NOTE(review): presumably depends on the Socket.IO client loaded in the
     head - confirm before adding defer/async to either script. -->
<script src="/static/js/app.js"></script>
|
|
</body>
|
|
</html>
|