Spaces:

DangoMachoo
/

Bot-and-life_speech-to-Text

Runtime error

App Files Files Community

DangoMachoo committed on Apr 23

Commit

6f2d374

1 Parent(s): ac59c9e

add main code

Browse files

Files changed (3) hide show

.gitignore +21 -0
app.py +48 -0
requirements.txt +49 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,21 @@

+#virtual environment
+venv/
+# Gradio
+flagged/
+gradio_cached_examples/
+# Model weights
+*.pt
+*.ckpt
+*.pth
+# Media outputs
+*.png
+*.jpg
+*.mp4
+*.mp3
+#code tests
+app1.py
+app2.py

app.py ADDED Viewed

	@@ -0,0 +1,48 @@

+import gradio as gr
+import torch
+from transformers import pipeline
+import os
+# Local development only: temporarily append an ffmpeg build to PATH.
+#os.environ["PATH"] += os.pathsep + r"C:\ffmpeg\ffmpeg-master-latest-win64-gpl\ffmpeg-master-latest-win64-gpl\bin"
+# Hugging Face model id of the speech-recognition checkpoint used by the app.
+MODEL_NAME = "biodatlab/whisper-th-small-combined"
+lang = "th"
+# Run on the first CUDA device when one is available, otherwise on the CPU.
+if torch.cuda.is_available():
+    device = 0
+else:
+    device = "cpu"
+# Shared speech-recognition pipeline; audio is processed in 30-second chunks.
+pipe = pipeline(
+    "automatic-speech-recognition",
+    model=MODEL_NAME,
+    device=device,
+    chunk_length_s=30,
+)
+# Speech-to-text handler used by the Gradio UI.
+def transcribe_audio(audio):
+    """Transcribe an audio file and prepare a downloadable transcript.
+
+    Args:
+        audio: Path of the audio file to transcribe, or None/empty when
+            nothing has been uploaded.
+
+    Returns:
+        A ``(text, txt_path)`` tuple: the transcript for on-screen display
+        and the path of a UTF-8 ``.txt`` file holding the same transcript.
+        Returns ``("", None)`` when no audio was supplied.
+    """
+    import tempfile
+
+    # Nothing uploaded yet: return empty outputs instead of failing in the pipeline.
+    if not audio:
+        return "", None
+
+    result = pipe(
+        audio,
+        generate_kwargs={"language": "<|th|>", "task": "transcribe"},
+        batch_size=16,
+    )
+    text = result["text"]
+
+    # The second output feeds a gr.File component, which needs a file path
+    # rather than the transcript itself, so persist the text to a temp file.
+    # delete=False keeps the file on disk after the handle is closed so it
+    # can still be served for download.
+    with tempfile.NamedTemporaryFile(
+        mode="w",
+        suffix=".txt",
+        prefix="transcript_",
+        encoding="utf-8",
+        delete=False,
+    ) as fh:
+        fh.write(text)
+    return text, fh.name
+# Gradio UI: one Blocks page with an audio upload, a transcript textbox,
+# a copy button, a file-download slot and a button that runs transcription.
+with gr.Blocks() as demo:
+    gr.Markdown("## 🎤 แปลงเสียงพูดภาษาไทยเป็นข้อความ")
+    with gr.Row():
+        # type="filepath": the handler receives the upload as a path on disk.
+        audio_input = gr.Audio(label="อัปโหลดไฟล์เสียง (MP3)", type="filepath")
+    with gr.Row():
+        transcribed_text = gr.Textbox(label="📜 ข้อความที่แปลงแล้ว", lines=10)
+    with gr.Row():
+        # NOTE(review): no event handler is attached to copy_button in this
+        # block, so clicking it currently does nothing.
+        copy_button = gr.Button("📋 Copy")
+        download_button = gr.File(label="⬇️ ดาวน์โหลด .txt")
+    # Button that starts the transcription.
+    transcribe_btn = gr.Button("🔄 แปลงเสียงเป็นข้อความ")
+    # On click: run transcribe_audio on the uploaded audio; its first return
+    # value goes to the textbox and its second to the file component.
+    transcribe_btn.click(
+        fn=transcribe_audio,
+        inputs=audio_input,
+        outputs=[transcribed_text, download_button]
+    )
+# Start the app server at import/run time (no __main__ guard).
+demo.launch()

requirements.txt ADDED Viewed

	@@ -0,0 +1,49 @@

+audioop-lts==0.2.1
+audioread==3.0.1
+certifi==2025.1.31
+cffi==1.17.1
+charset-normalizer==3.4.1
+colorama==0.4.6
+decorator==5.2.1
+ffmpeg-python==0.2.0
+filelock==3.18.0
+fsspec==2025.3.2
+future==1.0.0
+huggingface-hub==0.30.2
+idna==3.10
+Jinja2==3.1.6
+joblib==1.4.2
+lazy_loader==0.4
+librosa==0.11.0
+llvmlite==0.44.0
+MarkupSafe==3.0.2
+mpmath==1.3.0
+msgpack==1.1.0
+networkx==3.4.2
+numba==0.61.2
+numpy==2.2.5
+packaging==25.0
+platformdirs==4.3.7
+pooch==1.8.2
+pycparser==2.22
+PyYAML==6.0.2
+regex==2024.11.6
+requests==2.32.3
+safetensors==0.5.3
+scikit-learn==1.6.1
+scipy==1.15.2
+setuptools==79.0.0
+soundfile==0.13.1
+soxr==0.5.0.post1
+standard-aifc==3.13.0
+standard-chunk==3.13.0
+standard-sunau==3.13.0
+sympy==1.13.1
+threadpoolctl==3.6.0
+tokenizers==0.21.1
+torch==2.6.0
+torchaudio==2.6.0
+tqdm==4.67.1
+transformers @ git+https://github.com/huggingface/transformers@ca790303f7480e0211e5b58b9e22706f46dbf19a
+typing_extensions==4.13.2
+urllib3==2.4.0