Update src/streamlit_app.py
Browse files
- src/streamlit_app.py +18 -2
src/streamlit_app.py
CHANGED
|
@@ -1104,6 +1104,13 @@ if language_option == "Specify Language":
|
|
| 1104 |
)
|
| 1105 |
selected_language = language_codes[selected_language_name]
|
| 1106 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1107 |
# Load models
|
| 1108 |
with st.spinner(f"Loading models..."):
|
| 1109 |
model = load_whisper_model(model_size)
|
|
@@ -1209,8 +1216,17 @@ if uploaded_file is not None:
|
|
| 1209 |
"best_of": 1, # Use single best result
|
| 1210 |
"beam_size": 5, # Beam search size for better accuracy
|
| 1211 |
}
|
| 1212 |
-
|
| 1213 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1214 |
|
| 1215 |
# Show progress
|
| 1216 |
progress_placeholder = st.empty()
|
|
|
|
| 1104 |
)
|
| 1105 |
selected_language = language_codes[selected_language_name]
|
| 1106 |
|
| 1107 |
+
# Translation option: always output English text (for Hindi and other languages)
|
| 1108 |
+
translate_to_english = st.sidebar.checkbox(
|
| 1109 |
+
"Translate non-English speech to English text",
|
| 1110 |
+
value=True,
|
| 1111 |
+
help="When enabled, Whisper will output English text even if the speakers are talking in Hindi or other languages."
|
| 1112 |
+
)
|
| 1113 |
+
|
| 1114 |
# Load models
|
| 1115 |
with st.spinner(f"Loading models..."):
|
| 1116 |
model = load_whisper_model(model_size)
|
|
|
|
| 1216 |
"best_of": 1, # Use single best result
|
| 1217 |
"beam_size": 5, # Beam search size for better accuracy
|
| 1218 |
}
|
| 1219 |
+
# Language and translation handling
|
| 1220 |
+
if translate_to_english:
|
| 1221 |
+
# Ask Whisper to translate any non-English speech into English text
|
| 1222 |
+
transcribe_options["task"] = "translate"
|
| 1223 |
+
# If the user explicitly selected a source language (e.g. Hindi), pass it as the input language
|
| 1224 |
+
if selected_language and selected_language != "en":
|
| 1225 |
+
transcribe_options["language"] = selected_language
|
| 1226 |
+
else:
|
| 1227 |
+
# Normal transcription in the spoken language
|
| 1228 |
+
if selected_language:
|
| 1229 |
+
transcribe_options["language"] = selected_language
|
| 1230 |
|
| 1231 |
# Show progress
|
| 1232 |
progress_placeholder = st.empty()
|