RohanExploit · RohanExploit · Jan 30, 2026 · Jan 30, 2026 · Jan 30, 2026 · Jan 30, 2026
diff --git a/backend/hf_api_service.py b/backend/hf_api_service.py
@@ -30,6 +30,9 @@
 # Audio Classification Model
 AUDIO_CLASS_API_URL = "https://router.huggingface.co/models/MIT/ast-finetuned-audioset-10-10-0.4593"
 
+# Audio Transcription Model (Whisper large-v3-turbo endpoint posted to by transcribe_audio)
+WHISPER_API_URL = "https://router.huggingface.co/models/openai/whisper-large-v3-turbo"
+
 async def _make_request(client, url, payload):
     try:
         response = await client.post(url, headers=headers, json=payload, timeout=20.0)
@@ -166,6 +169,33 @@ async def do_post(c):
         logger.error(f"Audio Detection Error: {e}")
         return []
 
+async def transcribe_audio(audio_bytes: bytes, client: httpx.AsyncClient = None):
+    """
+    Send raw audio bytes to the Whisper model on the Hugging Face API.
+
+    Posts through `client` when given, else through a short-lived AsyncClient.
+    Returns the reply's "text" field, or "" on a non-200 status or any exception.
+    """
+    try:
+        auth_headers = {}
+        if token:
+            auth_headers["Authorization"] = f"Bearer {token}"
+        post_kwargs = {"headers": auth_headers, "content": audio_bytes, "timeout": 30.0}
+        if client:
+            reply = await client.post(WHISPER_API_URL, **post_kwargs)
+        else:
+            async with httpx.AsyncClient() as temp_client:
+                reply = await temp_client.post(WHISPER_API_URL, **post_kwargs)
+
+        if reply.status_code != 200:
+            logger.error(f"Whisper API Error: {reply.status_code} - {reply.text}")
+            return ""
+        # Result is usually {"text": "..."}
+        return reply.json().get("text", "")
+    except Exception as e:
+        logger.error(f"Audio Transcription Error: {e}")
+        return ""
+
 async def detect_severity_clip(image: Union[Image.Image, bytes], client: httpx.AsyncClient = None):
     """
     Returns a severity object: {level: 'High', confidence: 0.9, raw_label: 'critical...'}

diff --git a/backend/main.py b/backend/main.py
@@ -4,11 +4,11 @@
 from fastapi.middleware.gzip import GZipMiddleware
 from fastapi.concurrency import run_in_threadpool
 from sqlalchemy import func
-from sqlalchemy.orm import Session, defer
+from sqlalchemy.orm import Session, defer, joinedload
 from pydantic import BaseModel
 from contextlib import asynccontextmanager
 from functools import lru_cache
-from typing import List, Union, Any, Dict
+from typing import List, Union, Any, Dict, Optional
 from datetime import datetime, timedelta, timezone
 from PIL import Image
 
@@ -79,7 +79,8 @@
     detect_water_leak_clip,
     detect_accessibility_issue_clip,
     detect_crowd_density_clip,
-    detect_audio_event
+    detect_audio_event,
+    transcribe_audio
 )
 
 # Configure structured logging
@@ -1409,6 +1410,27 @@ async def detect_audio_endpoint(request: Request, file: UploadFile = File(...)):
         raise HTTPException(status_code=500, detail="Internal server error")
 
 
+@app.post("/api/transcribe-audio")
+async def transcribe_audio_endpoint(request: Request, file: UploadFile = File(...)):
+    """
+    Transcribe an uploaded audio file and return the result as {"text": ...}.
+
+    Raises HTTPException 413 when the upload exceeds 25MB, 400 when the upload
+    cannot be read, and 500 when an unexpected error occurs while transcribing.
+    """
+    max_audio_bytes = 25 * 1024 * 1024
+
+    # Basic audio validation: cheap early rejection when the upload reports its size
+    if hasattr(file, 'size') and file.size and file.size > max_audio_bytes:
+        raise HTTPException(status_code=413, detail="Audio file too large (max 25MB)")
+
+    try:
+        # Read exactly once; a repeated read() would continue from end-of-stream
+        audio_bytes = await file.read()
+    except Exception as e:
+        logger.error(f"Invalid audio file: {e}", exc_info=True)
+        raise HTTPException(status_code=400, detail="Invalid audio file")
+
+    # Enforce size limit based on actual bytes read, in case file.size is missing or inaccurate.
+    # Kept outside the try above so the 413 is not caught and rewritten into a 400.
+    if len(audio_bytes) > max_audio_bytes:
+        raise HTTPException(status_code=413, detail="Audio file too large (max 25MB)")
+
+    try:
+        client = request.app.state.http_client
+        text = await transcribe_audio(audio_bytes, client=client)
+        return {"text": text}
+    except Exception as e:
+        logger.error(f"Transcription error: {e}", exc_info=True)
+        raise HTTPException(status_code=500, detail="Internal server error")
+
+
 async def get_cached_or_compute(cache_key: str, compute_func, *args, **kwargs):
     """Get cached result or compute and cache it."""
     global _cache_cleanup_counter

diff --git a/frontend/eslint.config.js b/frontend/eslint.config.js
@@ -5,7 +5,7 @@ import reactRefresh from 'eslint-plugin-react-refresh'
 import { defineConfig, globalIgnores } from 'eslint/config'
 
 export default defineConfig([
-  globalIgnores(['dist']),
+  globalIgnores(['dist', '**/__tests__/**', '**/__mocks__/**', '**/*.test.js', 'src/setupTests.js']),
   {
     files: ['**/*.{js,jsx}'],
     extends: [