| from flask import Flask, request, jsonify, send_from_directory |
| from flask_cors import CORS |
| import sqlite3 |
| import os |
| import uuid |
| from datetime import datetime |
| from werkzeug.utils import secure_filename |
| import threading |
| import subprocess |
| import time |
|
|
| app = Flask(__name__) |
| CORS(app) |
|
|
| UPLOAD_FOLDER = 'uploads' |
| ALLOWED_EXTENSIONS = {'wav', 'mp3', 'flac', 'ogg', 'm4a', 'aac'} |
|
|
| os.makedirs(UPLOAD_FOLDER, exist_ok=True) |
| os.makedirs('temp_dir', exist_ok=True) |
|
|
| |
| worker_thread = None |
| worker_running = False |
|
|
| def init_db(): |
| conn = sqlite3.connect('audio_captions.db') |
| c = conn.cursor() |
| c.execute('''CREATE TABLE IF NOT EXISTS audio_files |
| (id TEXT PRIMARY KEY, |
| filename TEXT NOT NULL, |
| filepath TEXT NOT NULL, |
| status TEXT NOT NULL, |
| caption TEXT, |
| created_at TEXT NOT NULL, |
| processed_at TEXT)''') |
| conn.commit() |
| conn.close() |
|
|
| def allowed_file(filename): |
| return '.' in filename and filename.rsplit('.', 1)[1].lower() in ALLOWED_EXTENSIONS |
|
|
| def start_worker(): |
| """Start the worker thread if not already running""" |
| global worker_thread, worker_running |
| |
| if not worker_running: |
| worker_running = True |
| worker_thread = threading.Thread(target=worker_loop, daemon=True) |
| worker_thread.start() |
| print("β
Worker thread started") |
|
|
| def worker_loop(): |
| """Main worker loop that processes audio files""" |
| print("π€ STT Worker started. Monitoring for new audio files...") |
| |
| CWD = "./" |
| PYTHON_PATH = "stt-transcribe" |
| STT_MODEL_NAME = "fasterwhispher" |
| POLL_INTERVAL = 3 |
| |
| import shlex |
| import json |
| |
| while worker_running: |
| try: |
| |
| conn = sqlite3.connect('audio_captions.db') |
| conn.row_factory = sqlite3.Row |
| c = conn.cursor() |
| c.execute('''SELECT * FROM audio_files |
| WHERE status = 'not_started' |
| ORDER BY created_at ASC |
| LIMIT 1''') |
| row = c.fetchone() |
| conn.close() |
| |
| if row: |
| file_id = row['id'] |
| filepath = row['filepath'] |
| filename = row['filename'] |
| |
| print(f"\n{'='*60}") |
| print(f"π΅ Processing: {filename}") |
| print(f"π ID: {file_id}") |
| print(f"{'='*60}") |
| |
| |
| update_status(file_id, 'processing') |
| |
| try: |
| |
| print(f"π Running STT on: {os.path.abspath(filepath)}") |
| command = f"""cd {CWD} && {PYTHON_PATH} --input {shlex.quote(os.path.abspath(filepath))} --model {STT_MODEL_NAME}""" |
| |
| subprocess.run( |
| command, |
| shell=True, |
| executable="/bin/bash", |
| check=True, |
| cwd=CWD, |
| env={ |
| **os.environ, |
| 'PYTHONUNBUFFERED': '1', |
| 'CUDA_LAUNCH_BLOCKING': '1', |
| 'USE_CPU_IF_POSSIBLE': 'true' |
| } |
| ) |
| |
| |
| output_path = f'{CWD}/temp_dir/output_transcription.json' |
| with open(output_path, 'r') as file: |
| result = json.loads(file.read().strip()) |
| |
| |
| caption = result.get('text', '') or result.get('transcription', '') or str(result) |
| |
| print(f"β
Successfully processed: {filename}") |
| print(f"π Caption preview: {caption[:100]}...") |
| |
| |
| update_status(file_id, 'completed', caption=json.dumps(result)) |
| |
| |
| if os.path.exists(filepath): |
| os.remove(filepath) |
| print(f"ποΈ Deleted audio file: {filepath}") |
| |
| except Exception as e: |
| print(f"β Failed to process: {filename}") |
| print(f"Error: {str(e)}") |
| update_status(file_id, 'failed', error=str(e)) |
| |
| |
| |
| |
| else: |
| |
| time.sleep(POLL_INTERVAL) |
| |
| except Exception as e: |
| print(f"β οΈ Worker error: {str(e)}") |
| time.sleep(POLL_INTERVAL) |
|
|
| def update_status(file_id, status, caption=None, error=None): |
| """Update the status of a file in the database""" |
| conn = sqlite3.connect('audio_captions.db') |
| c = conn.cursor() |
| |
| if status == 'completed': |
| c.execute('''UPDATE audio_files |
| SET status = ?, caption = ?, processed_at = ? |
| WHERE id = ?''', |
| (status, caption, datetime.now().isoformat(), file_id)) |
| elif status == 'failed': |
| c.execute('''UPDATE audio_files |
| SET status = ?, caption = ?, processed_at = ? |
| WHERE id = ?''', |
| (status, f"Error: {error}", datetime.now().isoformat(), file_id)) |
| else: |
| c.execute('UPDATE audio_files SET status = ? WHERE id = ?', (status, file_id)) |
| |
| conn.commit() |
| conn.close() |
|
|
| @app.route('/') |
| def index(): |
| return send_from_directory('.', 'index.html') |
|
|
| @app.route('/api/upload', methods=['POST']) |
| def upload_audio(): |
| if 'audio' not in request.files: |
| return jsonify({'error': 'No audio file provided'}), 400 |
| |
| file = request.files['audio'] |
| |
| if file.filename == '': |
| return jsonify({'error': 'No file selected'}), 400 |
| |
| if not allowed_file(file.filename): |
| return jsonify({'error': 'Invalid file type'}), 400 |
| |
| file_id = str(uuid.uuid4()) |
| filename = secure_filename(file.filename) |
| filepath = os.path.join(UPLOAD_FOLDER, f"{file_id}_{filename}") |
| file.save(filepath) |
| |
| conn = sqlite3.connect('audio_captions.db') |
| c = conn.cursor() |
| c.execute('''INSERT INTO audio_files |
| (id, filename, filepath, status, created_at) |
| VALUES (?, ?, ?, ?, ?)''', |
| (file_id, filename, filepath, 'not_started', datetime.now().isoformat())) |
| conn.commit() |
| conn.close() |
| |
| |
| start_worker() |
| |
| return jsonify({ |
| 'id': file_id, |
| 'filename': filename, |
| 'status': 'not_started', |
| 'message': 'File uploaded successfully' |
| }), 201 |
|
|
| @app.route('/api/files', methods=['GET']) |
| def get_files(): |
| conn = sqlite3.connect('audio_captions.db') |
| conn.row_factory = sqlite3.Row |
| c = conn.cursor() |
| c.execute('SELECT * FROM audio_files ORDER BY created_at DESC') |
| rows = c.fetchall() |
| conn.close() |
| |
| files = [] |
| for row in rows: |
| files.append({ |
| 'id': row['id'], |
| 'filename': row['filename'], |
| 'status': row['status'], |
| 'caption': row['caption'], |
| 'created_at': row['created_at'], |
| 'processed_at': row['processed_at'] |
| }) |
| |
| return jsonify(files) |
|
|
| @app.route('/api/files/<file_id>', methods=['GET']) |
| def get_file(file_id): |
| conn = sqlite3.connect('audio_captions.db') |
| conn.row_factory = sqlite3.Row |
| c = conn.cursor() |
| c.execute('SELECT * FROM audio_files WHERE id = ?', (file_id,)) |
| row = c.fetchone() |
| conn.close() |
| |
| if row is None: |
| return jsonify({'error': 'File not found'}), 404 |
| |
| return jsonify({ |
| 'id': row['id'], |
| 'filename': row['filename'], |
| 'status': row['status'], |
| 'caption': row['caption'], |
| 'created_at': row['created_at'], |
| 'processed_at': row['processed_at'] |
| }) |
|
|
| @app.route('/health', methods=['GET']) |
| def health(): |
| return jsonify({ |
| 'status': 'healthy', |
| 'service': 'audio-caption-generator', |
| 'worker_running': worker_running |
| }) |
|
|
| if __name__ == '__main__': |
| init_db() |
| print("\n" + "="*60) |
| print("π Audio Caption Generator API Server") |
| print("="*60) |
| print("π Worker will start automatically on first upload") |
| print("ποΈ Audio files will be deleted after successful processing") |
| print("="*60 + "\n") |
| |
| |
| port = int(os.environ.get('PORT', 7860)) |
| app.run(debug=False, host='0.0.0.0', port=port) |