lite

2025-06-18 19:28:48 +05:30 · 2025-06-18 19:28:48 +05:30 · 1c43f63b70
parent 4d20931ecc
commit 1c43f63b70
2 changed files with 64 additions and 49 deletions
--- a/app.py
+++ b/app.py
@ -3,73 +3,82 @@ import os
 import uuid
 import subprocess
 from werkzeug.utils import secure_filename
+import time
+import random

 app = Flask(__name__)
 UPLOAD_FOLDER = '/data'
 ALLOWED_EXTENSIONS = {'wav', 'mp3', 'ogg', 'flac'}

 def allowed_file(filename):
-return '.' in filename and filename.rsplit('.', 1)[1].lower() in ALLOWED_EXTENSIONS
+    return '.' in filename and filename.rsplit('.', 1)[1].lower() in ALLOWED_EXTENSIONS
+
+def generate_filename():
+    timestamp = int(time.time())
+    random_num = random.randint(1000, 9999)
+    return f"{timestamp}-{random_num}"

@app.route('/stt', methods=['POST'])
 def transcribe():
-if 'audio' not in request.files:
-return jsonify({"error": "No audio file provided"}), 400
+    if 'audio' not in request.files:
+        return jsonify({"error": "No audio file provided"}), 400

-file = request.files['audio']
-if file.filename == '':
-return jsonify({"error": "Empty filename"}), 400
+    file = request.files['audio']
+    if file.filename == '':
+        return jsonify({"error": "Empty filename"}), 400

-if not file or not allowed_file(file.filename):
-return jsonify({"error": "Invalid file type"}), 400
+    if not file or not allowed_file(file.filename):
+        return jsonify({"error": "Invalid file type"}), 400

-try:
-# Generate unique filename
-file_id = str(uuid.uuid4())
-orig_ext = secure_filename(file.filename).rsplit('.', 1)[1].lower()
-orig_path = os.path.join(UPLOAD_FOLDER, f"{file_id}.{orig_ext}")
-wav_path = os.path.join(UPLOAD_FOLDER, f"{file_id}.wav")
-output_base = os.path.join(UPLOAD_FOLDER, file_id)
+    try:
+        # Generate filename with timestamp + random number
+        file_base = generate_filename()
+        orig_ext = secure_filename(file.filename).rsplit('.', 1)[1].lower()
+        orig_path = os.path.join(UPLOAD_FOLDER, f"{file_base}.{orig_ext}")
+        wav_path = os.path.join(UPLOAD_FOLDER, f"{file_base}.wav")
+        output_base = os.path.join(UPLOAD_FOLDER, file_base)

-# Save original file
-file.save(orig_path)
+        # Save original file
+        file.save(orig_path)

-# Convert to WAV if needed
-if orig_ext != 'wav':
-subprocess.run([
-'ffmpeg', '-i', orig_path,
-'-ar', '16000', '-ac', '1', '-c:a', 'pcm_s16le', wav_path
-], check=True)
-os.remove(orig_path)
-audio_path = wav_path
-else:
-audio_path = orig_path
+        # Convert to WAV if needed
+        if orig_ext != 'wav':
+            subprocess.run([
+                'ffmpeg', '-i', orig_path,
+                '-ar', '16000', '-ac', '1', '-c:a', 'pcm_s16le', wav_path
+            ], check=True)
+            os.remove(orig_path)
+            audio_path = wav_path
+        else:
+            audio_path = orig_path

-# Run whisper.cpp
-subprocess.run([
-'/app/whisper.cpp/build/bin/main',
-'-m', '/app/whisper.cpp/models/ggml-base.bin',
-'-f', audio_path,
-'-otxt', '-of', output_base
-], check=True)
+        # Run whisper.cpp
+        subprocess.run([
+            '/app/whisper.cpp/build/bin/main',
+            '-m', '/app/whisper.cpp/models/ggml-tiny.en-q5_1.bin',
+            '-f', audio_path,
+            '-otxt', '-of', output_base
+        ], check=True)

-# Read output
-output_file = f"{output_base}.txt"
-with open(output_file, 'r') as f:
-transcription = f.read()
+        # Read output
+        output_file = f"{output_base}.txt"
+        with open(output_file, 'r') as f:
+            transcription = f.read()

-# Cleanup
-for f in [orig_path, wav_path, audio_path, output_file]:
-if os.path.exists(f):
-os.remove(f)
+        # Return the filenames in the response
+        response = {
+            "text": transcription.strip(),
+            "audio_file": f"{file_base}.{orig_ext}",
+            "text_file": f"{file_base}.txt"
+        }

-return jsonify({"text": transcription.strip()})
+        return jsonify(response)

-except subprocess.CalledProcessError as e:
-return jsonify({"error": f"Whisper processing failed: {e.stderr}"}), 500
-except Exception as e:
-return jsonify({"error": str(e)}), 500
+    except subprocess.CalledProcessError as e:
+        return jsonify({"error": f"Whisper processing failed: {e.stderr}"}), 500
+    except Exception as e:
+        return jsonify({"error": str(e)}), 500

 if __name__ == '__main__':
-os.makedirs(UPLOAD_FOLDER, exist_ok=True)
-app.run(host='0.0.0.0', port=4004)
+    os.makedirs(UPLOAD_FOLDER, exist_ok=True)
+    app.run(host='0.0.0.0', port=4004)
--- a/6
+++ b/6
@ -0,0 +1,6 @@
+docker build -t whisper-api .
+
+docker run -itd --name stt-41-lite -p 4004:4004 \
+-v $(pwd)/whisper.cpp-1.5.2/models:/models \
+-v $(pwd)/data:/data \
+whisper-api