Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -139,11 +139,29 @@ def convert_text_to_speech(input_text, source_language, target_language):
|
|
| 139 |
api_name="/run" # API name
|
| 140 |
)
|
| 141 |
|
| 142 |
-
# Check if result contains files
|
| 143 |
if isinstance(result, list) and len(result) > 1:
|
| 144 |
-
|
| 145 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 146 |
|
|
|
|
|
|
|
|
|
|
| 147 |
# Iterate over the result to find the last text item
|
| 148 |
translated_text = ""
|
| 149 |
for item in result:
|
|
@@ -365,7 +383,6 @@ def process_and_query(input_language=None, audio_input=None, image_input=None, t
|
|
| 365 |
markdown_output = ""
|
| 366 |
image_text = ""
|
| 367 |
translated_text = ""
|
| 368 |
-
audio_file_path = ""
|
| 369 |
audio_output = ""
|
| 370 |
# Debugging print statement
|
| 371 |
print(f"Image Input Type: {type(image_input)}, Audio Input Type: {type(audio_input)}")
|
|
@@ -416,7 +433,7 @@ def process_and_query(input_language=None, audio_input=None, image_input=None, t
|
|
| 416 |
|
| 417 |
# Convert translated text to speech and get both audio file and text
|
| 418 |
target_language = "English" # Set the target language for the speech
|
| 419 |
-
|
| 420 |
|
| 421 |
# Evaluate hallucination
|
| 422 |
hallucination_label = evaluate_hallucination(final_response, summary)
|
|
|
|
| 139 |
api_name="/run" # API name
|
| 140 |
)
|
| 141 |
|
| 142 |
+
# Check if result contains files
|
| 143 |
if isinstance(result, list) and len(result) > 1:
|
| 144 |
+
downloaded_files = []
|
| 145 |
+
for file_path in result[1:]:
|
| 146 |
+
if os.path.isfile(file_path):
|
| 147 |
+
# Download the file
|
| 148 |
+
downloaded_files.append(file_path)
|
| 149 |
+
else:
|
| 150 |
+
print(f"Path is not a file: {file_path}")
|
| 151 |
+
|
| 152 |
+
if downloaded_files:
|
| 153 |
+
# Process only the first file
|
| 154 |
+
original_audio_file = downloaded_files[0]
|
| 155 |
+
new_file_name = f"audio_output_{uuid.uuid4()}.wav"
|
| 156 |
+
new_file_path = os.path.join(os.path.dirname(original_audio_file), new_file_name)
|
| 157 |
+
os.rename(original_audio_file, new_file_path)
|
| 158 |
+
return new_file_path
|
| 159 |
+
else:
|
| 160 |
+
return "No valid audio files were downloaded."
|
| 161 |
|
| 162 |
+
else:
|
| 163 |
+
return "No audio files received from the API."
|
| 164 |
+
|
| 165 |
# Iterate over the result to find the last text item
|
| 166 |
translated_text = ""
|
| 167 |
for item in result:
|
|
|
|
| 383 |
markdown_output = ""
|
| 384 |
image_text = ""
|
| 385 |
translated_text = ""
|
|
|
|
| 386 |
audio_output = ""
|
| 387 |
# Debugging print statement
|
| 388 |
print(f"Image Input Type: {type(image_input)}, Audio Input Type: {type(audio_input)}")
|
|
|
|
| 433 |
|
| 434 |
# Convert translated text to speech and get both audio file and text
|
| 435 |
target_language = "English" # Set the target language for the speech
|
| 436 |
+
audio_output, translated_text = convert_text_to_speech(final_response, target_language, input_language)
|
| 437 |
|
| 438 |
# Evaluate hallucination
|
| 439 |
hallucination_label = evaluate_hallucination(final_response, summary)
|