From 44beeacd3e33019866f269e6f6d9a881fb99147a Mon Sep 17 00:00:00 2001
From: 01PrathamS <pratham21btai35@karnavatiuniversity.edu.in>
Date: Fri, 5 Dec 2025 17:44:22 +0530
Subject: [PATCH 01/10] audio upload extension with gdrive credentials

---
 backends/advanced/pyproject.toml              |  3 +
 .../src/advanced_omi_backend/app_config.py    | 24 +++++
 .../routers/modules/audio_routes.py           | 14 +++
 .../utils/gdrive_audio_utils.py               | 87 +++++++++++++++++++
 backends/advanced/webui/src/pages/Upload.tsx  | 81 +++++++++++++++++
 backends/advanced/webui/src/services/api.ts   | 11 ++-
 6 files changed, 218 insertions(+), 2 deletions(-)
 create mode 100644 backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py

diff --git a/backends/advanced/pyproject.toml b/backends/advanced/pyproject.toml
index 5f635cbb..b021d8d4 100644
--- a/backends/advanced/pyproject.toml
+++ b/backends/advanced/pyproject.toml
@@ -24,6 +24,9 @@ dependencies = [
     "redis>=5.0.0",
     "rq>=1.16.0",
     "soundfile>=0.12.1",
+    "google-api-python-client>=2.0.0",
+    "google-auth-oauthlib>=1.0.0",
+    "google-auth-httplib2>=0.2.0",
 ]
 
 [project.optional-dependencies]
diff --git a/backends/advanced/src/advanced_omi_backend/app_config.py b/backends/advanced/src/advanced_omi_backend/app_config.py
index 4caa70c5..330028a7 100644
--- a/backends/advanced/src/advanced_omi_backend/app_config.py
+++ b/backends/advanced/src/advanced_omi_backend/app_config.py
@@ -85,6 +85,30 @@ def __init__(self):
         # Memory service configuration
         self.memory_service_supports_threshold = self.memory_provider == "friend_lite"
 
+        self.gdrive_credentials_path = "data/gdrive_service_account.json"
+        self.gdrive_scopes = ["https://www.googleapis.com/auth/drive.readonly"]
+        self._gdrive_service = None
+
+    def get_gdrive_service(self):
+        """Return Google Drive API client using stored service account."""
+        from google.oauth2.service_account import Credentials
+        from googleapiclient.discovery import build
+        if self._gdrive_service:
+            return self._gdrive_service
+
+        if not os.path.exists(self.gdrive_credentials_path):
+            raise FileNotFoundError(
+                f"Missing Google Drive credentials at {self.gdrive_credentials_path}"
+            )
+
+        creds = Credentials.from_service_account_file(
+            self.gdrive_credentials_path,
+            scopes=self.gdrive_scopes,
+        )
+
+        self._gdrive_service = build("drive", "v3", credentials=creds)
+        return self._gdrive_service
+
 
 # Global configuration instance
 app_config = AppConfig()
diff --git a/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py b/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
index 4c0f756b..4ebdcce2 100644
--- a/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
+++ b/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
@@ -12,10 +12,24 @@
 from advanced_omi_backend.controllers import audio_controller
 from advanced_omi_backend.models.user import User
 from advanced_omi_backend.app_config import get_audio_chunk_dir
+from advanced_omi_backend.utils.gdrive_audio_utils import download_audio_files_from_drive
 
 router = APIRouter(prefix="/audio", tags=["audio"])
 
 
+@router.post("/upload_audio_from_url")
+async def upload_audio_from_drive_folder(
+    drive_folder_id: str = Query(...,alias="url", description="Google Drive Folder ID containing audio files (e.g., the string after /folders/ in the URL)"),
+    current_user: User = Depends(current_superuser),
+    device_name: str = Query(default="upload"),
+    auto_generate_client: bool = Query(default=True),
+):
+    files = await download_audio_files_from_drive(drive_folder_id)
+
+    return await audio_controller.upload_and_process_audio_files(
+        current_user, files, device_name, auto_generate_client
+    )
+
 @router.post("/upload")
 async def upload_audio_files(
     current_user: User = Depends(current_superuser),
diff --git a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
new file mode 100644
index 00000000..d664162e
--- /dev/null
+++ b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
@@ -0,0 +1,87 @@
+import os
+import io
+import tempfile
+from typing import List
+from starlette.datastructures import UploadFile as StarletteUploadFile
+from googleapiclient.http import MediaIoBaseDownload
+from advanced_omi_backend.app_config import get_app_config
+
+AUDIO_EXTENSIONS = (".wav", ".mp3", ".flac", ".ogg")
+FOLDER_MIMETYPE = "application/vnd.google-apps.folder"
+
+
+class AudioValidationError(Exception):
+    pass
+
+
+# -------------------------------------------------------------
+# DOWNLOAD A SINGLE FILE (OAUTH)
+# -------------------------------------------------------------
+async def download_and_wrap_drive_file(service, file_item):
+    file_id = file_item["id"]
+    name = file_item["name"]
+
+    request = service.files().get_media(fileId=file_id)
+
+    fh = io.BytesIO()
+    downloader = MediaIoBaseDownload(fh, request)
+
+    done = False
+    while not done:
+        status, done = downloader.next_chunk()
+
+    content = fh.getvalue()
+
+    if not content:
+        raise AudioValidationError(f"Downloaded Google Drive file '{name}' was empty")
+
+    tmp_file = tempfile.NamedTemporaryFile(delete=False)
+    tmp_file.write(content)
+    tmp_file.flush()
+
+    # Wrap in Starlette UploadFile to mimic standard uploads
+    return StarletteUploadFile(
+        filename=name,
+        file=open(tmp_file.name, "rb"),
+    )
+
+
+# -------------------------------------------------------------
+# LIST + DOWNLOAD FILES IN FOLDER (OAUTH)
+# -------------------------------------------------------------
+async def download_audio_files_from_drive(folder_id: str) -> List[StarletteUploadFile]:
+    if not folder_id:
+        raise AudioValidationError("Google Drive folder ID is required.")
+
+    service = get_app_config().get_gdrive_service()
+
+    try:
+        query = f"'{folder_id}' in parents and trashed = false"
+
+        response = service.files().list(
+            q=query,
+            fields="files(id, name, mimeType)",
+            includeItemsFromAllDrives=False,
+            supportsAllDrives=False,
+        ).execute()
+
+        all_files = response.get("files", [])
+
+        audio_files = [
+            f for f in all_files
+            if f["name"].lower().endswith(AUDIO_EXTENSIONS)
+        ]
+
+        if not audio_files:
+            raise AudioValidationError("No audio files found in folder.")
+
+        wrapped_files = []
+        for item in audio_files:
+            wrapped_files.append(await download_and_wrap_drive_file(service, item))
+
+        return wrapped_files
+
+    except Exception as e:
+        if isinstance(e, AudioValidationError):
+            raise
+        raise AudioValidationError(f"Google Drive API Error: {repr(e)}")
diff --git a/backends/advanced/webui/src/pages/Upload.tsx b/backends/advanced/webui/src/pages/Upload.tsx
index 04e7d24c..ae20b39b 100644
--- a/backends/advanced/webui/src/pages/Upload.tsx
+++ b/backends/advanced/webui/src/pages/Upload.tsx
@@ -15,11 +15,53 @@ export default function Upload() {
   const [isUploading, setIsUploading] = useState(false)
   const [dragActive, setDragActive] = useState(false)
   const [uploadProgress, setUploadProgress] = useState(0)
+  const [audioUrl, setAudioUrl] = useState('')
 
   const { isAdmin } = useAuth()
 
   const generateId = () => Math.random().toString(36).substr(2, 9)
 
+  const [urlUploadStatus, setUrlUploadStatus] = useState<{
+  type: 'success' | 'error' | null
+  message: string
+}>({ type: null, message: '' })
+
+
+  // Handle URL submission
+  const handleUrlSubmit = async () => {
+  if (!audioUrl) return
+
+  setIsUploading(true)
+  setUrlUploadStatus({ type: null, message: '' })
+
+  try {
+    const response = await uploadApi.uploadAudioFromUrl({
+      drive_folder_id: audioUrl,
+      device_name: 'upload',
+      auto_generate_client: true,
+    })
+
+    console.log('URL Upload response:', response)
+
+    setUrlUploadStatus({
+      type: 'success',
+      message: `Audio submitted successfully`,
+    })
+
+    setAudioUrl('')
+  } catch (err: any) {
+    console.error('URL upload failed:', err)
+
+    setUrlUploadStatus({
+      type: 'error',
+      message:
+        err?.response?.data?.detail || 'Failed to upload audio from URL',
+    })
+  } finally {
+    setIsUploading(false)
+  }
+}
+
   const handleFileSelect = (selectedFiles: FileList | null) => {
     if (!selectedFiles) return
 
@@ -152,6 +194,44 @@ export default function Upload() {
           Upload Audio Files
         </h1>
       </div>
+      {/* URL Input */}
+      <div className="mb-6 p-4 bg-gray-50 dark:bg-gray-700 rounded-lg border border-gray-200 dark:border-gray-600">
+  <label className="block mb-2 font-medium text-gray-900 dark:text-gray-100">
+    Paste audio URL:
+  </label>
+
+  <div className="flex space-x-2">
+    <input
+      type="text"
+      value={audioUrl}
+      onChange={(e) => setAudioUrl(e.target.value)}
+      placeholder="https://example.com/audio.wav"
+      className="flex-1 px-3 py-2 border rounded-lg dark:bg-gray-800 dark:text-gray-100"
+    />
+
+    <button
+      onClick={handleUrlSubmit}
+      disabled={isUploading || !audioUrl}
+      className="px-4 py-2 bg-blue-600 text-white rounded-lg hover:bg-blue-700 disabled:opacity-50 disabled:cursor-not-allowed"
+    >
+      {isUploading ? 'Submitting...' : 'Submit URL'}
+    </button>
+  </div>
+
+  {/* ✅ Add the status message here */}
+  {urlUploadStatus.type && (
+    <div
+      className={`mt-3 p-3 rounded-lg text-sm ${
+        urlUploadStatus.type === 'success'
+          ? 'bg-green-100 text-green-800 border border-green-300'
+          : 'bg-red-100 text-red-800 border border-red-300'
+      }`}
+    >
+      {urlUploadStatus.message}
+    </div>
+  )}
+</div>
+
 
       {/* Drop Zone */}
       <div
@@ -290,6 +370,7 @@ export default function Upload() {
           📝 Upload Instructions
         </h3>
         <ul className="text-sm text-yellow-700 dark:text-yellow-300 space-y-1">
+          <li>• Hello world</li>
           <li>• Audio files will be processed sequentially for transcription and memory extraction</li>
           <li>• Processing time varies based on audio length (roughly 3x the audio duration + 60s)</li>
           <li>• Large files or multiple files may cause timeout errors - this is normal</li>
diff --git a/backends/advanced/webui/src/services/api.ts b/backends/advanced/webui/src/services/api.ts
index abe7678c..0c4e20f7 100644
--- a/backends/advanced/webui/src/services/api.ts
+++ b/backends/advanced/webui/src/services/api.ts
@@ -165,7 +165,7 @@ export const queueApi = {
 }
 
 export const uploadApi = {
-  uploadAudioFiles: (files: FormData, onProgress?: (progress: number) => void) => 
+  uploadAudioFiles: (files: FormData, onProgress?: (progress: number) => void) =>
     api.post('/api/audio/upload', files, {
       headers: { 'Content-Type': 'multipart/form-data' },
       timeout: 300000, // 5 minutes
@@ -174,10 +174,17 @@ export const uploadApi = {
           const progress = Math.round((progressEvent.loaded * 100) / progressEvent.total)
           onProgress(progress)
         }
-      }
+      },
+    }),
+
+  uploadAudioFromUrl: (payload: { drive_folder_id: string; device_name?: string; auto_generate_client?: boolean }) =>
+    api.post('/api/audio/upload_audio_from_url', null, {
+      params: payload.drive_folder_id,
+      timeout: 300000, // optional: 5 minutes
     }),
 }
 
+
 export const chatApi = {
   // Session management
   createSession: (title?: string) => api.post('/api/chat/sessions', { title }),

From d5b9518ddb955eb2a1f02bc35f3a9ec24bccddb9 Mon Sep 17 00:00:00 2001
From: Pratham Savaliya <pratham21btai35@karnavatiuniversity.edu.in>
Date: Fri, 5 Dec 2025 22:11:35 +0530
Subject: [PATCH 02/10] FIX: API parameters

---
 backends/advanced/webui/src/services/api.ts | 14 ++++++++++----
 1 file changed, 10 insertions(+), 4 deletions(-)

diff --git a/backends/advanced/webui/src/services/api.ts b/backends/advanced/webui/src/services/api.ts
index 0c4e20f7..fc0de23c 100644
--- a/backends/advanced/webui/src/services/api.ts
+++ b/backends/advanced/webui/src/services/api.ts
@@ -177,10 +177,16 @@ export const uploadApi = {
       },
     }),
 
-  uploadAudioFromUrl: (payload: { drive_folder_id: string; device_name?: string; auto_generate_client?: boolean }) =>
-    api.post('/api/audio/upload_audio_from_url', null, {
-      params: payload.drive_folder_id,
-      timeout: 300000, // optional: 5 minutes
+uploadAudioFromUrl: (payload: { drive_folder_id: string; device_name?: string; auto_generate_client?: boolean }) =>
+    // 1. Set the POST body to null (or leave it out, though explicit null is cleaner for no body)
+    api.post('/api/audio/upload_audio_from_url', null, { 
+      // 2. Pass the entire payload object to the 'params' configuration key
+      params: { 
+        url: payload.drive_folder_id, // IMPORTANT: Use 'url' here to match the backend's alias
+        device_name: payload.device_name,
+        auto_generate_client: payload.auto_generate_client,
+      },
+      timeout: 300000,
     }),
 }
 

From 5b5ea64aaac1e44c9cbadfb4eeb50d8f047e8c06 Mon Sep 17 00:00:00 2001
From: 01PrathamS <pratham21btai35@karnavatiuniversity.edu.in>
Date: Mon, 8 Dec 2025 16:54:19 +0530
Subject: [PATCH 03/10] UPDATE: tmp files cleanup and code refactored as per
 review

---
 .../utils/gdrive_audio_utils.py               | 27 +++++++++++++------
 backends/advanced/webui/src/pages/Upload.tsx  |  1 -
 2 files changed, 19 insertions(+), 9 deletions(-)

diff --git a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
index d664162e..6ce4c411 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
@@ -1,12 +1,13 @@
 import os
 import io
 import tempfile
+import atexit
 from typing import List
 from starlette.datastructures import UploadFile as StarletteUploadFile
 from googleapiclient.http import MediaIoBaseDownload
 from advanced_omi_backend.app_config import get_app_config
 
-AUDIO_EXTENSIONS = (".wav", ".mp3", ".flac", ".ogg")
+AUDIO_EXTENSIONS = (".wav", ".mp3", ".flac", ".ogg", ".m4a")
 FOLDER_MIMETYPE = "application/vnd.google-apps.folder"
 
 
@@ -35,15 +36,25 @@ async def download_and_wrap_drive_file(service, file_item):
     if not content:
         raise AudioValidationError(f"Downloaded Google Drive file '{name}' was empty")
 
-    tmp_file = tempfile.NamedTemporaryFile(delete=False)
+    tmp_file = tempfile.SpooledTemporaryFile(max_size=10*1024*1024)  # 10 MB
     tmp_file.write(content)
-    tmp_file.flush()
+    tmp_file.seek(0)
+    upload_file = StarletteUploadFile(filename=name, file=tmp_file)
 
-    # Wrap in Starlette UploadFile to mimic standard uploads
-    return StarletteUploadFile(
-        filename=name,
-        file=open(tmp_file.name, "rb"),
-    )
+    original_close = upload_file.close
+
+    def wrapped_close():
+        try:
+            original_close()
+        finally:
+            try:
+                os.unlink(tmp_file.name)
+            except FileNotFoundError:
+                pass
+
+    upload_file.close = wrapped_close
+
+    return upload_file
 
 
 # -------------------------------------------------------------
diff --git a/backends/advanced/webui/src/pages/Upload.tsx b/backends/advanced/webui/src/pages/Upload.tsx
index ae20b39b..1f0e5ce1 100644
--- a/backends/advanced/webui/src/pages/Upload.tsx
+++ b/backends/advanced/webui/src/pages/Upload.tsx
@@ -370,7 +370,6 @@ export default function Upload() {
           📝 Upload Instructions
         </h3>
         <ul className="text-sm text-yellow-700 dark:text-yellow-300 space-y-1">
-          <li>• Hello world</li>
           <li>• Audio files will be processed sequentially for transcription and memory extraction</li>
           <li>• Processing time varies based on audio length (roughly 3x the audio duration + 60s)</li>
           <li>• Large files or multiple files may cause timeout errors - this is normal</li>

From 5abd99d83dcf59c37ba7b2295a792ddee67f19e2 Mon Sep 17 00:00:00 2001
From: 01PrathamS <pratham21btai35@karnavatiuniversity.edu.in>
Date: Mon, 8 Dec 2025 17:09:32 +0530
Subject: [PATCH 04/10] REFACTOR: minor refactor as per review

---
 .../utils/gdrive_audio_utils.py               | 21 +++++++------------
 1 file changed, 8 insertions(+), 13 deletions(-)

diff --git a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
index 6ce4c411..398a1427 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
@@ -15,10 +15,7 @@ class AudioValidationError(Exception):
     pass
 
 
-# -------------------------------------------------------------
-# DOWNLOAD A SINGLE FILE (OAUTH)
-# -------------------------------------------------------------
-async def download_and_wrap_drive_file(service, file_item):
+def download_and_wrap_drive_file(service, file_item):
     file_id = file_item["id"]
     name = file_item["name"]
 
@@ -29,7 +26,7 @@ async def download_and_wrap_drive_file(service, file_item):
 
     done = False
     while not done:
-        status, done = downloader.next_chunk()
+        _status, done = downloader.next_chunk()
 
     content = fh.getvalue()
 
@@ -47,20 +44,17 @@ def wrapped_close():
         try:
             original_close()
         finally:
-            try:
-                os.unlink(tmp_file.name)
-            except FileNotFoundError:
-                pass
+            # SpooledTemporaryFile auto-cleans when closed; no unlink needed
+            pass
 
     upload_file.close = wrapped_close
 
     return upload_file
 
-
 # -------------------------------------------------------------
 # LIST + DOWNLOAD FILES IN FOLDER (OAUTH)
 # -------------------------------------------------------------
-async def download_audio_files_from_drive(folder_id: str) -> List[StarletteUploadFile]:
+def download_audio_files_from_drive(folder_id: str) -> List[StarletteUploadFile]:
     if not folder_id:
         raise AudioValidationError("Google Drive folder ID is required.")
 
@@ -88,11 +82,12 @@ async def download_audio_files_from_drive(folder_id: str) -> List[StarletteUploa
 
         wrapped_files = []
         for item in audio_files:
-            wrapped_files.append(await download_and_wrap_drive_file(service, item))
+            # synchronous call now
+            wrapped_files.append(download_and_wrap_drive_file(service, item))
 
         return wrapped_files
 
     except Exception as e:
         if isinstance(e, AudioValidationError):
             raise
-        raise AudioValidationError(f"Google Drive API Error: {repr(e)}")
+        raise AudioValidationError(f"Google Drive API Error: {e}") from e
\ No newline at end of file

From 3d00bac95b818ef0486460a1fe322237e205703d Mon Sep 17 00:00:00 2001
From: 01PrathamS <pratham21btai35@karnavatiuniversity.edu.in>
Date: Mon, 8 Dec 2025 17:34:23 +0530
Subject: [PATCH 05/10] REFACTOR: minor update as per review

---
 .../src/advanced_omi_backend/utils/gdrive_audio_utils.py       | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
index 398a1427..49143281 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
@@ -61,7 +61,8 @@ def download_audio_files_from_drive(folder_id: str) -> List[StarletteUploadFile]
     service = get_app_config().get_gdrive_service()
 
     try:
-        query = f"'{folder_id}' in parents and trashed = false"
+        escaped_folder_id = folder_id.replace("\\", "\\\\").replace("'", "\\'")
+        query = f"'{escaped_folder_id}' in parents and trashed = false"
 
         response = service.files().list(
             q=query,

From b0361854c8693283ffc0229b26565563b339da44 Mon Sep 17 00:00:00 2001
From: 01PrathamS <pratham21btai35@karnavatiuniversity.edu.in>
Date: Tue, 9 Dec 2025 16:56:47 +0530
Subject: [PATCH 06/10] UPDATE: gdrive sync logic

---
 .../controllers/audio_controller.py           |  7 ++-
 .../advanced_omi_backend/models/audio_file.py |  6 ++-
 .../advanced_omi_backend/utils/audio_utils.py |  6 ++-
 .../utils/gdrive_audio_utils.py               | 49 +++++++++++++++----
 4 files changed, 53 insertions(+), 15 deletions(-)

diff --git a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
index da884eb6..2f1d5513 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
@@ -81,6 +81,8 @@ async def upload_and_process_audio_files(
                 # Read file content
                 content = await file.read()
 
+                gdrive_file_id = getattr(file, "gdrive_file_id", None)
+
                 # Generate audio UUID and timestamp
                 audio_uuid = str(uuid.uuid4())
                 timestamp = int(time.time() * 1000)
@@ -103,7 +105,8 @@ async def upload_and_process_audio_files(
                         user_email=user.email,
                         timestamp=timestamp,
                         chunk_dir=chunk_dir,
-                        validate=True  # Validate WAV format, convert stereo→mono
+                        validate=True,  # Validate WAV format, convert stereo→mono
+                        gdrive_file_id=gdrive_file_id
                     )
                 except AudioValidationError as e:
                     processed_files.append({
@@ -133,7 +136,7 @@ async def upload_and_process_audio_files(
                 # Use the relative path returned by write_audio_file (already includes folder prefix if applicable)
                 conversation.audio_path = relative_audio_path
                 await conversation.insert()
-                conversation_id = conversation.conversation_id  # Get the auto-generated ID
+                conversation_id = conversation.conversation_id  # Get the auto-generated ID
 
                 audio_logger.info(f"📝 Created conversation {conversation_id} for uploaded file")
 
diff --git a/backends/advanced/src/advanced_omi_backend/models/audio_file.py b/backends/advanced/src/advanced_omi_backend/models/audio_file.py
index de1c6f3f..6d2efa4c 100644
--- a/backends/advanced/src/advanced_omi_backend/models/audio_file.py
+++ b/backends/advanced/src/advanced_omi_backend/models/audio_file.py
@@ -51,11 +51,15 @@ class AudioFile(Document):
         description="Speech detection results"
     )
 
+    gdrive_file_id: Optional[str] = Field(default=None, description="Google Drive file id")
+
+
     class Settings:
         name = "audio_chunks"
         indexes = [
             "audio_uuid",
             "client_id",
             "user_id",
-            "timestamp"
+            "timestamp", 
+            "gdrive_file_id"
         ]
\ No newline at end of file
diff --git a/backends/advanced/src/advanced_omi_backend/utils/audio_utils.py b/backends/advanced/src/advanced_omi_backend/utils/audio_utils.py
index c6e5bfea..84e4e47d 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/audio_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/audio_utils.py
@@ -107,7 +107,8 @@ async def write_audio_file(
     user_email: str,
     timestamp: int,
     chunk_dir: Optional[Path] = None,
-    validate: bool = True
+    validate: bool = True,
+    gdrive_file_id: Optional[str] = None,
 ) -> tuple[str, str, float]:
     """
     Validate, write audio data to WAV file, and create AudioSession database entry.
@@ -203,7 +204,8 @@ async def write_audio_file(
         user_id=user_id,
         user_email=user_email,
         has_speech=False,  # Will be updated by transcription
-        speech_analysis={}
+        speech_analysis={}, 
+        gdrive_file_id=gdrive_file_id
     )
     await audio_file.insert()
 
diff --git a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
index 49143281..dbd3ec99 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
@@ -1,12 +1,14 @@
-import os
 import io
 import tempfile
-import atexit
 from typing import List
+import logging
 from starlette.datastructures import UploadFile as StarletteUploadFile
 from googleapiclient.http import MediaIoBaseDownload
 from advanced_omi_backend.app_config import get_app_config
 
+logger = logging.getLogger(__name__)
+audio_logger = logging.getLogger("audio_processing")
+
 AUDIO_EXTENSIONS = (".wav", ".mp3", ".flac", ".ogg", ".m4a")
 FOLDER_MIMETYPE = "application/vnd.google-apps.folder"
 
@@ -15,7 +17,7 @@ class AudioValidationError(Exception):
     pass
 
 
-def download_and_wrap_drive_file(service, file_item):
+async def download_and_wrap_drive_file(service, file_item):
     file_id = file_item["id"]
     name = file_item["name"]
 
@@ -54,7 +56,7 @@ def wrapped_close():
 # -------------------------------------------------------------
 # LIST + DOWNLOAD FILES IN FOLDER (OAUTH)
 # -------------------------------------------------------------
-def download_audio_files_from_drive(folder_id: str) -> List[StarletteUploadFile]:
+async def download_audio_files_from_drive(folder_id: str) -> List[StarletteUploadFile]:
     if not folder_id:
         raise AudioValidationError("Google Drive folder ID is required.")
 
@@ -73,22 +75,49 @@ def download_audio_files_from_drive(folder_id: str) -> List[StarletteUploadFile]
 
         all_files = response.get("files", [])
 
-        audio_files = [
+        audio_files_metadata = [
             f for f in all_files
             if f["name"].lower().endswith(AUDIO_EXTENSIONS)
         ]
 
-        if not audio_files:
+        if not audio_files_metadata:
             raise AudioValidationError("No audio files found in folder.")
 
         wrapped_files = []
-        for item in audio_files:
-            # synchronous call now
-            wrapped_files.append(download_and_wrap_drive_file(service, item))
+        skipped_count = 0
+        
+        for item in audio_files_metadata:
+            file_id = item["id"] # Get the Google Drive File ID
+            
+            #  Check if the file is already processed
+            if await is_drive_file_already_processed(file_id):
+                audio_logger.info(f"Skipping already processed file: {item['name']}") # Use your logger
+                skipped_count += 1
+                continue
+
+            # Download and wrap the file; the helper is a coroutine, so it is awaited
+            wrapped_file = await download_and_wrap_drive_file(service, item)
+            #  Attach the file_id to the UploadFile object for later use
+            setattr(wrapped_file, "gdrive_file_id", file_id) 
+            wrapped_files.append(wrapped_file)
+            
+        if not wrapped_files and skipped_count > 0:
+            raise AudioValidationError(f"All {skipped_count} files in the folder have already been processed.")
 
         return wrapped_files
 
     except Exception as e:
         if isinstance(e, AudioValidationError):
             raise
-        raise AudioValidationError(f"Google Drive API Error: {e}") from e
\ No newline at end of file
+        raise AudioValidationError(f"Google Drive API Error: {e}") from e
+    
+
+async def is_drive_file_already_processed(gdrive_file_id: str) -> bool:
+    """Check if an AudioFile document already exists for the given GDrive File ID."""
+    if not gdrive_file_id:
+        return False
+    from advanced_omi_backend.models.audio_file import AudioFile     
+    existing_file = await AudioFile.find_one(
+        AudioFile.gdrive_file_id == gdrive_file_id
+    )
+    return existing_file is not None
\ No newline at end of file

From cff1a4cf7388f0ed6f48ee6756fb05517b76960a Mon Sep 17 00:00:00 2001
From: 01PrathamS <pratham21btai35@karnavatiuniversity.edu.in>
Date: Wed, 10 Dec 2025 11:53:37 +0530
Subject: [PATCH 07/10] REFACTOR: code update as per gdrive and update
 credential client

---
 .../src/advanced_omi_backend/app_config.py    |  21 --
 .../clients/gdrive_audio_client.py            |  29 +++
 .../routers/modules/audio_routes.py           |   6 +-
 .../utils/gdrive_audio_utils.py               |   4 +-
 backends/advanced/webui/src/pages/Upload.tsx  | 241 +++++++++---------
 backends/advanced/webui/src/services/api.ts   |  10 +-
 6 files changed, 157 insertions(+), 154 deletions(-)
 create mode 100644 backends/advanced/src/advanced_omi_backend/clients/gdrive_audio_client.py

diff --git a/backends/advanced/src/advanced_omi_backend/app_config.py b/backends/advanced/src/advanced_omi_backend/app_config.py
index 330028a7..0cd087a7 100644
--- a/backends/advanced/src/advanced_omi_backend/app_config.py
+++ b/backends/advanced/src/advanced_omi_backend/app_config.py
@@ -87,27 +87,6 @@ def __init__(self):
 
         self.gdrive_credentials_path = "data/gdrive_service_account.json"
         self.gdrive_scopes = ["https://www.googleapis.com/auth/drive.readonly"]
-        self._gdrive_service = None
-
-    def get_gdrive_service(self):
-        """Return Google Drive API client using stored service account."""
-        from google.oauth2.service_account import Credentials
-        from googleapiclient.discovery import build
-        if self._gdrive_service:
-            return self._gdrive_service
-
-        if not os.path.exists(self.gdrive_credentials_path):
-            raise FileNotFoundError(
-                f"Missing Google Drive credentials at {self.gdrive_credentials_path}"
-            )
-
-        creds = Credentials.from_service_account_file(
-            self.gdrive_credentials_path,
-            scopes=self.gdrive_scopes,
-        )
-
-        self._gdrive_service = build("drive", "v3", credentials=creds)
-        return self._gdrive_service
 
 
 # Global configuration instance
diff --git a/backends/advanced/src/advanced_omi_backend/clients/gdrive_audio_client.py b/backends/advanced/src/advanced_omi_backend/clients/gdrive_audio_client.py
new file mode 100644
index 00000000..5a6271e1
--- /dev/null
+++ b/backends/advanced/src/advanced_omi_backend/clients/gdrive_audio_client.py
@@ -0,0 +1,29 @@
+import os 
+from google.oauth2.service_account import Credentials
+from googleapiclient.discovery import build
+from advanced_omi_backend.app_config import get_app_config
+
+_drive_client_cache = None
+
+def get_google_drive_client():
+    """Singleton Google Drive client."""
+    global _drive_client_cache
+
+    if _drive_client_cache:
+        return _drive_client_cache
+
+    config = get_app_config()
+
+    if not os.path.exists(config.gdrive_credentials_path):
+        raise FileNotFoundError(
+            f"Missing Google Drive credentials at {config.gdrive_credentials_path}"
+        )
+
+    creds = Credentials.from_service_account_file(
+        config.gdrive_credentials_path,
+        scopes=config.gdrive_scopes
+    )
+
+    _drive_client_cache = build("drive", "v3", credentials=creds)
+
+    return _drive_client_cache
diff --git a/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py b/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
index b8605fea..e8ba091f 100644
--- a/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
+++ b/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
@@ -17,14 +17,14 @@
 router = APIRouter(prefix="/audio", tags=["audio"])
 
 
-@router.post("/upload_audio_from_url")
+@router.post("/upload_audio_from_gdrive")
 async def upload_audio_from_drive_folder(
-    drive_folder_id: str = Query(...,alias="url", description="Google Drive Folder ID containing audio files (e.g., the string after /folders/ in the URL)"),
+    gdrive_folder_id: str = Query(..., description="Google Drive Folder ID containing audio files (e.g., the string after /folders/ in the URL)"),
     current_user: User = Depends(current_superuser),
     device_name: str = Query(default="upload"),
     auto_generate_client: bool = Query(default=True),
 ):
-    files = await download_audio_files_from_drive(drive_folder_id)
+    files = await download_audio_files_from_drive(gdrive_folder_id)
 
     return await audio_controller.upload_and_process_audio_files(
         current_user, files, device_name, auto_generate_client
diff --git a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
index dbd3ec99..2b6efd8d 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
@@ -5,6 +5,8 @@
 from starlette.datastructures import UploadFile as StarletteUploadFile
 from googleapiclient.http import MediaIoBaseDownload
 from advanced_omi_backend.app_config import get_app_config
+from advanced_omi_backend.clients.gdrive_audio_client import get_google_drive_client
+
 
 logger = logging.getLogger(__name__)
 audio_logger = logging.getLogger("audio_processing")
@@ -60,7 +62,7 @@ async def download_audio_files_from_drive(folder_id: str) -> List[StarletteUploa
     if not folder_id:
         raise AudioValidationError("Google Drive folder ID is required.")
 
-    service = get_app_config().get_gdrive_service()
+    service = get_google_drive_client()
 
     try:
         escaped_folder_id = folder_id.replace("\\", "\\\\").replace("'", "\\'")
diff --git a/backends/advanced/webui/src/pages/Upload.tsx b/backends/advanced/webui/src/pages/Upload.tsx
index 1f0e5ce1..c32ee396 100644
--- a/backends/advanced/webui/src/pages/Upload.tsx
+++ b/backends/advanced/webui/src/pages/Upload.tsx
@@ -15,85 +15,80 @@ export default function Upload() {
   const [isUploading, setIsUploading] = useState(false)
   const [dragActive, setDragActive] = useState(false)
   const [uploadProgress, setUploadProgress] = useState(0)
-  const [audioUrl, setAudioUrl] = useState('')
+  const [gdriveFolderId, setGdriveFolderId] = useState('')
 
   const { isAdmin } = useAuth()
 
   const generateId = () => Math.random().toString(36).substr(2, 9)
 
-  const [urlUploadStatus, setUrlUploadStatus] = useState<{
-  type: 'success' | 'error' | null
-  message: string
-}>({ type: null, message: '' })
+  const [gdriveUploadStatus, setGdriveUploadStatus] = useState<{
+    type: 'success' | 'error' | null
+    message: string
+  }>({
+    type: null,
+    message: ''
+  })
 
+  // Handle Google Drive folder submission
+  const handleGDriveSubmit = async () => {
+    if (!gdriveFolderId) return
 
-  // Handle URL submission
-  const handleUrlSubmit = async () => {
-  if (!audioUrl) return
-
-  setIsUploading(true)
-  setUrlUploadStatus({ type: null, message: '' })
-
-  try {
-    const response = await uploadApi.uploadAudioFromUrl({
-      drive_folder_id: audioUrl,
-      device_name: 'upload',
-      auto_generate_client: true,
-    })
-
-    console.log('URL Upload response:', response)
+    setIsUploading(true)
+    setGdriveUploadStatus({ type: null, message: '' })
 
-    setUrlUploadStatus({
-      type: 'success',
-      message: `Audio submitted successfully`,
-    })
+    try {
+      await uploadApi.uploadFromGDriveFolder({
+        gdrive_folder_id: gdriveFolderId,
+        device_name: 'upload',
+        auto_generate_client: true,
+      })
 
-    setAudioUrl('')
-  } catch (err: any) {
-    console.error('URL upload failed:', err)
+      setGdriveUploadStatus({
+        type: 'success',
+        message: 'Google Drive folder submitted successfully.',
+      })
 
-    setUrlUploadStatus({
-      type: 'error',
-      message:
-        err?.response?.data?.detail || 'Failed to upload audio from URL',
-    })
-  } finally {
-    setIsUploading(false)
+      setGdriveFolderId('')
+    } catch (err: any) {
+      setGdriveUploadStatus({
+        type: 'error',
+        message: err?.response?.data?.detail || 'Failed to upload folder.',
+      })
+    } finally {
+      setIsUploading(false)
+    }
   }
-}
 
   const handleFileSelect = (selectedFiles: FileList | null) => {
     if (!selectedFiles) return
 
-    const audioFiles = Array.from(selectedFiles).filter(file => 
-      file.type.startsWith('audio/') || 
-      file.name.toLowerCase().endsWith('.wav') ||
-      file.name.toLowerCase().endsWith('.mp3') ||
-      file.name.toLowerCase().endsWith('.m4a') ||
-      file.name.toLowerCase().endsWith('.flac')
+    const audioFiles = Array.from(selectedFiles).filter(
+      (file) =>
+        file.type.startsWith('audio/') ||
+        file.name.toLowerCase().endsWith('.wav') ||
+        file.name.toLowerCase().endsWith('.mp3') ||
+        file.name.toLowerCase().endsWith('.m4a') ||
+        file.name.toLowerCase().endsWith('.flac')
     )
 
-    const newFiles: UploadFile[] = audioFiles.map(file => ({
+    const newFiles: UploadFile[] = audioFiles.map((file) => ({
       file,
       id: generateId(),
-      status: 'pending'
+      status: 'pending',
     }))
 
-    setFiles(prevFiles => [...prevFiles, ...newFiles])
+    setFiles((prev) => [...prev, ...newFiles])
   }
 
   const removeFile = (id: string) => {
-    setFiles(files.filter(f => f.id !== id))
+    setFiles(files.filter((f) => f.id !== id))
   }
 
   const handleDrag = useCallback((e: React.DragEvent) => {
     e.preventDefault()
     e.stopPropagation()
-    if (e.type === 'dragenter' || e.type === 'dragover') {
-      setDragActive(true)
-    } else if (e.type === 'dragleave') {
-      setDragActive(false)
-    }
+    if (e.type === 'dragenter' || e.type === 'dragover') setDragActive(true)
+    else if (e.type === 'dragleave') setDragActive(false)
   }, [])
 
   const handleDrop = useCallback((e: React.DragEvent) => {
@@ -115,29 +110,25 @@ export default function Upload() {
         formData.append('files', file)
       })
 
-      // Update all files to uploading status
-      setFiles(prevFiles => 
-        prevFiles.map(f => ({ ...f, status: 'uploading' as const }))
+      setFiles((prev) =>
+        prev.map((f) => ({ ...f, status: 'uploading' }))
       )
 
       await uploadApi.uploadAudioFiles(formData, (progress) => {
         setUploadProgress(progress)
       })
-      
-      // Mark all files as successful
-      setFiles(prevFiles => 
-        prevFiles.map(f => ({ ...f, status: 'success' as const }))
-      )
 
-    } catch (error: any) {
-      console.error('Upload failed:', error)
-      
-      // Mark all files as failed
-      setFiles(prevFiles => 
-        prevFiles.map(f => ({ 
-          ...f, 
-          status: 'error' as const, 
-          error: error.message || 'Upload failed' 
+      setFiles((prev) =>
+        prev.map((f) => ({ ...f, status: 'success' }))
+      )
+    } catch (err: any) {
+      console.error('Upload failed:', err)
+
+      setFiles((prev) =>
+        prev.map((f) => ({
+          ...f,
+          status: 'error',
+          error: err.message || 'Upload failed',
         }))
       )
     } finally {
@@ -147,7 +138,7 @@ export default function Upload() {
   }
 
   const clearCompleted = () => {
-    setFiles(files.filter(f => f.status === 'pending' || f.status === 'uploading'))
+    setFiles(files.filter((f) => f.status === 'pending' || f.status === 'uploading'))
   }
 
   const formatFileSize = (bytes: number) => {
@@ -155,7 +146,7 @@ export default function Upload() {
     const k = 1024
     const sizes = ['Bytes', 'KB', 'MB', 'GB']
     const i = Math.floor(Math.log(bytes) / Math.log(k))
-    return parseFloat((bytes / Math.pow(k, i)).toFixed(2)) + ' ' + sizes[i]
+    return `${(bytes / Math.pow(k, i)).toFixed(2)} ${sizes[i]}`
   }
 
   const getStatusIcon = (status: UploadFile['status']) => {
@@ -194,44 +185,43 @@ export default function Upload() {
           Upload Audio Files
         </h1>
       </div>
-      {/* URL Input */}
+
+      {/* Google Drive Folder Upload */}
       <div className="mb-6 p-4 bg-gray-50 dark:bg-gray-700 rounded-lg border border-gray-200 dark:border-gray-600">
-  <label className="block mb-2 font-medium text-gray-900 dark:text-gray-100">
-    Paste audio URL:
-  </label>
-
-  <div className="flex space-x-2">
-    <input
-      type="text"
-      value={audioUrl}
-      onChange={(e) => setAudioUrl(e.target.value)}
-      placeholder="https://example.com/audio.wav"
-      className="flex-1 px-3 py-2 border rounded-lg dark:bg-gray-800 dark:text-gray-100"
-    />
-
-    <button
-      onClick={handleUrlSubmit}
-      disabled={isUploading || !audioUrl}
-      className="px-4 py-2 bg-blue-600 text-white rounded-lg hover:bg-blue-700 disabled:opacity-50 disabled:cursor-not-allowed"
-    >
-      {isUploading ? 'Submitting...' : 'Submit URL'}
-    </button>
-  </div>
-
-  {/* ✅ Add the status message here */}
-  {urlUploadStatus.type && (
-    <div
-      className={`mt-3 p-3 rounded-lg text-sm ${
-        urlUploadStatus.type === 'success'
-          ? 'bg-green-100 text-green-800 border border-green-300'
-          : 'bg-red-100 text-red-800 border border-red-300'
-      }`}
-    >
-      {urlUploadStatus.message}
-    </div>
-  )}
-</div>
+        <label className="block mb-2 font-medium text-gray-900 dark:text-gray-100">
+          Paste Google Drive Folder ID:
+        </label>
+
+        <div className="flex space-x-2">
+          <input
+            type="text"
+            value={gdriveFolderId}
+            onChange={(e) => setGdriveFolderId(e.target.value)}
+            placeholder="1AbCdEfGhIjKlMnOpQrStUvWxYz123456"
+            className="flex-1 px-3 py-2 border rounded-lg dark:bg-gray-800 dark:text-gray-100"
+          />
+
+          <button
+            onClick={handleGDriveSubmit}
+            disabled={isUploading || !gdriveFolderId}
+            className="px-4 py-2 bg-blue-600 text-white rounded-lg hover:bg-blue-700 disabled:opacity-50"
+          >
+            {isUploading ? 'Submitting...' : 'Submit Folder'}
+          </button>
+        </div>
 
+        {gdriveUploadStatus.type && (
+          <div
+            className={`mt-3 p-3 rounded-lg text-sm ${
+              gdriveUploadStatus.type === 'success'
+                ? 'bg-green-100 text-green-800 border border-green-300'
+                : 'bg-red-100 text-red-800 border border-red-300'
+            }`}
+          >
+            {gdriveUploadStatus.message}
+          </div>
+        )}
+      </div>
 
       {/* Drop Zone */}
       <div
@@ -252,7 +242,7 @@ export default function Upload() {
         <p className="text-sm text-gray-600 dark:text-gray-400 mb-4">
           Supported formats: WAV, MP3, M4A, FLAC
         </p>
-        
+
         <input
           type="file"
           multiple
@@ -260,10 +250,10 @@ export default function Upload() {
           onChange={(e) => handleFileSelect(e.target.files)}
           className="absolute inset-0 w-full h-full opacity-0 cursor-pointer"
         />
-        
+
         <button
           onClick={() => (document.querySelector('input[type="file"]') as HTMLInputElement)?.click()}
-          className="px-4 py-2 bg-blue-600 text-white rounded-lg hover:bg-blue-700 transition-colors"
+          className="px-4 py-2 bg-blue-600 text-white rounded-lg hover:bg-blue-700"
         >
           Select Files
         </button>
@@ -279,14 +269,14 @@ export default function Upload() {
             <div className="flex space-x-2">
               <button
                 onClick={clearCompleted}
-                className="px-3 py-1 text-sm bg-gray-600 text-white rounded hover:bg-gray-700 transition-colors"
+                className="px-3 py-1 text-sm bg-gray-600 text-white rounded hover:bg-gray-700"
               >
                 Clear Completed
               </button>
               <button
                 onClick={uploadFiles}
-                disabled={isUploading || files.every(f => f.status !== 'pending')}
-                className="px-4 py-2 bg-blue-600 text-white rounded-lg hover:bg-blue-700 transition-colors disabled:opacity-50 disabled:cursor-not-allowed"
+                disabled={isUploading || files.every((f) => f.status !== 'pending')}
+                className="px-4 py-2 bg-blue-600 text-white rounded-lg hover:bg-blue-700 disabled:opacity-50"
               >
                 {isUploading ? 'Uploading...' : 'Upload All'}
               </button>
@@ -317,19 +307,24 @@ export default function Upload() {
                 </div>
 
                 <div className="flex items-center space-x-2">
-                  <span className={`text-sm font-medium ${
-                    uploadFile.status === 'success' ? 'text-green-600' :
-                    uploadFile.status === 'error' ? 'text-red-600' :
-                    uploadFile.status === 'uploading' ? 'text-blue-600' :
-                    'text-gray-600 dark:text-gray-400'
-                  }`}>
+                  <span
+                    className={`text-sm font-medium ${
+                      uploadFile.status === 'success'
+                        ? 'text-green-600'
+                        : uploadFile.status === 'error'
+                        ? 'text-red-600'
+                        : uploadFile.status === 'uploading'
+                        ? 'text-blue-600'
+                        : 'text-gray-600 dark:text-gray-400'
+                    }`}
+                  >
                     {uploadFile.status.charAt(0).toUpperCase() + uploadFile.status.slice(1)}
                   </span>
-                  
+
                   {uploadFile.status === 'pending' && (
                     <button
                       onClick={() => removeFile(uploadFile.id)}
-                      className="p-1 text-red-600 hover:bg-red-50 dark:hover:bg-red-900/20 rounded transition-colors"
+                      className="p-1 text-red-600 hover:bg-red-50 dark:hover:bg-red-900/20 rounded"
                     >
                       <X className="h-4 w-4" />
                     </button>
@@ -371,12 +366,12 @@ export default function Upload() {
         </h3>
         <ul className="text-sm text-yellow-700 dark:text-yellow-300 space-y-1">
           <li>• Audio files will be processed sequentially for transcription and memory extraction</li>
-          <li>• Processing time varies based on audio length (roughly 3x the audio duration + 60s)</li>
-          <li>• Large files or multiple files may cause timeout errors - this is normal</li>
-          <li>• Check the Conversations tab to see processed results</li>
+          <li>• Processing time varies based on audio length (roughly 3× duration + 60s)</li>
+          <li>• Large files or multiple files may cause timeout errors</li>
+          <li>• Check the Conversations tab for processed results</li>
           <li>• Supported formats: WAV, MP3, M4A, FLAC</li>
         </ul>
       </div>
     </div>
   )
-}
\ No newline at end of file
+}
diff --git a/backends/advanced/webui/src/services/api.ts b/backends/advanced/webui/src/services/api.ts
index 3c16f173..86bf655d 100644
--- a/backends/advanced/webui/src/services/api.ts
+++ b/backends/advanced/webui/src/services/api.ts
@@ -191,12 +191,10 @@ export const uploadApi = {
       },
     }),
 
-uploadAudioFromUrl: (payload: { drive_folder_id: string; device_name?: string; auto_generate_client?: boolean }) =>
-    // 1. Set the POST body to null (or leave it out, though explicit null is cleaner for no body)
-    api.post('/api/audio/upload_audio_from_url', null, { 
-      // 2. Pass the entire payload object to the 'params' configuration key
-      params: { 
-        url: payload.drive_folder_id, // IMPORTANT: Use 'url' here to match the backend's alias
+  uploadFromGDriveFolder: (payload: { gdrive_folder_id: string; device_name?: string; auto_generate_client?: boolean }) =>
+    api.post('/api/audio/upload_audio_from_gdrive', null, {
+      params: {
+        gdrive_folder_id: payload.gdrive_folder_id,
         device_name: payload.device_name,
         auto_generate_client: payload.auto_generate_client,
       },

From 6534288efae767d48947009950bab924fe8eac26 Mon Sep 17 00:00:00 2001
From: 01PrathamS <pratham21btai35@karnavatiuniversity.edu.in>
Date: Wed, 10 Dec 2025 12:23:19 +0530
Subject: [PATCH 08/10] REFACTOR: validation updated - as per review from CR

---
 .../advanced_omi_backend/routers/modules/audio_routes.py | 7 +++++--
 .../src/advanced_omi_backend/utils/gdrive_audio_utils.py | 9 +++------
 2 files changed, 8 insertions(+), 8 deletions(-)

diff --git a/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py b/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
index e8ba091f..6da6f9b2 100644
--- a/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
+++ b/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
@@ -12,7 +12,7 @@
 from advanced_omi_backend.controllers import audio_controller
 from advanced_omi_backend.models.user import User
 from advanced_omi_backend.app_config import get_audio_chunk_dir
-from advanced_omi_backend.utils.gdrive_audio_utils import download_audio_files_from_drive
+from advanced_omi_backend.utils.gdrive_audio_utils import download_audio_files_from_drive, AudioValidationError
 
 router = APIRouter(prefix="/audio", tags=["audio"])
 
@@ -24,7 +24,10 @@ async def upload_audio_from_drive_folder(
     device_name: str = Query(default="upload"),
     auto_generate_client: bool = Query(default=True),
 ):
-    files = await download_audio_files_from_drive(gdrive_folder_id)
+    try: 
+        files = await download_audio_files_from_drive(gdrive_folder_id)
+    except AudioValidationError as e: 
+        raise HTTPException(status_code=400, detail=str(e))
 
     return await audio_controller.upload_and_process_audio_files(
         current_user, files, device_name, auto_generate_client
diff --git a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
index 2b6efd8d..09c3da17 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
@@ -4,8 +4,9 @@
 import logging
 from starlette.datastructures import UploadFile as StarletteUploadFile
 from googleapiclient.http import MediaIoBaseDownload
-from advanced_omi_backend.app_config import get_app_config
 from advanced_omi_backend.clients.gdrive_audio_client import get_google_drive_client
+from advanced_omi_backend.models.audio_file import AudioFile
+from advanced_omi_backend.utils.audio_utils import AudioValidationError
 
 
 logger = logging.getLogger(__name__)
@@ -15,9 +16,6 @@
 FOLDER_MIMETYPE = "application/vnd.google-apps.folder"
 
 
-class AudioValidationError(Exception):
-    pass
-
 
 async def download_and_wrap_drive_file(service, file_item):
     file_id = file_item["id"]
@@ -100,7 +98,7 @@ async def download_audio_files_from_drive(folder_id: str) -> List[StarletteUploa
             # synchronous call now (but make the parent function async)
             wrapped_file = await download_and_wrap_drive_file(service, item)
             #  Attach the file_id to the UploadFile object for later use
-            setattr(wrapped_file, "gdrive_file_id", file_id) 
+            wrapped_file.gdrive_file_id = file_id
             wrapped_files.append(wrapped_file)
             
         if not wrapped_files and skipped_count > 0:
@@ -118,7 +116,6 @@ async def is_drive_file_already_processed(gdrive_file_id: str) -> bool:
     """Check if an AudioFile document already exists for the given GDrive File ID."""
     if not gdrive_file_id:
         return False
-    from advanced_omi_backend.models.audio_file import AudioFile     
     existing_file = await AudioFile.find_one(
         AudioFile.gdrive_file_id == gdrive_file_id
     )

From 1ff28cbcc4f83c18704feaff10f2e5636d643a70 Mon Sep 17 00:00:00 2001
From: 01PrathamS <pratham21btai35@karnavatiuniversity.edu.in>
Date: Mon, 15 Dec 2025 16:32:51 +0530
Subject: [PATCH 09/10] UPDATE: code has been refactored for UUID for
 different audio upload sources

---
 .../controllers/audio_controller.py           |   9 +-
 .../advanced_omi_backend/models/audio_file.py |   6 +-
 .../routers/modules/audio_routes.py           |   2 +-
 .../advanced_omi_backend/utils/audio_utils.py |   4 +-
 .../utils/dropbox_audio_utils.py              | 150 ++++++++++++++++++
 .../utils/gdrive_audio_utils.py               |  19 +--
 6 files changed, 171 insertions(+), 19 deletions(-)
 create mode 100644 backends/advanced/src/advanced_omi_backend/utils/dropbox_audio_utils.py

diff --git a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
index 2f1d5513..06492ff2 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
@@ -40,6 +40,7 @@ async def upload_and_process_audio_files(
     device_name: str = "upload",
     auto_generate_client: bool = True,
     folder: str = None,
+    source: str = "upload"
 ) -> dict:
     """
     Upload audio files and process them directly.
@@ -81,10 +82,12 @@ async def upload_and_process_audio_files(
                 # Read file content
                 content = await file.read()
 
-                gdrive_file_id = getattr(file, "gdrive_file_id", None)
 
                 # Generate audio UUID and timestamp
-                audio_uuid = str(uuid.uuid4())
+                if source == "gdrive":
+                    audio_uuid = getattr(file, "audio_uuid", None)
+                else: 
+                    audio_uuid = str(uuid.uuid4())
                 timestamp = int(time.time() * 1000)
 
                 # Determine output directory (with optional subfolder)
@@ -100,13 +103,13 @@ async def upload_and_process_audio_files(
                     relative_audio_path, file_path, duration = await write_audio_file(
                         raw_audio_data=content,
                         audio_uuid=audio_uuid,
+                        source=source,
                         client_id=client_id,
                         user_id=user.user_id,
                         user_email=user.email,
                         timestamp=timestamp,
                         chunk_dir=chunk_dir,
                         validate=True,  # Validate WAV format, convert stereo→mono
-                        gdrive_file_id=gdrive_file_id
                     )
                 except AudioValidationError as e:
                     processed_files.append({
diff --git a/backends/advanced/src/advanced_omi_backend/models/audio_file.py b/backends/advanced/src/advanced_omi_backend/models/audio_file.py
index 6d2efa4c..3e8cc4b3 100644
--- a/backends/advanced/src/advanced_omi_backend/models/audio_file.py
+++ b/backends/advanced/src/advanced_omi_backend/models/audio_file.py
@@ -29,6 +29,10 @@ class AudioFile(Document):
 
     # Core identifiers
     audio_uuid: Indexed(str, unique=True) = Field(description="Unique audio identifier")
+    source: Indexed(str) = Field(
+        default="upload",
+        description="Source of the audio (upload, gdrive, etc.)"
+    )
     audio_path: str = Field(description="Path to raw audio file")
     client_id: Indexed(str) = Field(description="Client device identifier")
     timestamp: Indexed(int) = Field(description="Unix timestamp in milliseconds")
@@ -51,7 +55,6 @@ class AudioFile(Document):
         description="Speech detection results"
     )
 
-    gdrive_file_id: Optional[str] = Field(default=None, description="Google Drive file id")
 
 
     class Settings:
@@ -61,5 +64,4 @@ class Settings:
             "client_id",
             "user_id",
             "timestamp", 
-            "gdrive_file_id"
         ]
\ No newline at end of file
diff --git a/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py b/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
index 6da6f9b2..056e7667 100644
--- a/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
+++ b/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
@@ -30,7 +30,7 @@ async def upload_audio_from_drive_folder(
         raise HTTPException(status_code=400, detail=str(e))
 
     return await audio_controller.upload_and_process_audio_files(
-        current_user, files, device_name, auto_generate_client
+        current_user, files, device_name, auto_generate_client, source="gdrive"
     )
 
 
diff --git a/backends/advanced/src/advanced_omi_backend/utils/audio_utils.py b/backends/advanced/src/advanced_omi_backend/utils/audio_utils.py
index 84e4e47d..3a3b554d 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/audio_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/audio_utils.py
@@ -102,13 +102,13 @@ async def validate_and_prepare_audio(
 async def write_audio_file(
     raw_audio_data: bytes,
     audio_uuid: str,
+    source: str,
     client_id: str,
     user_id: str,
     user_email: str,
     timestamp: int,
     chunk_dir: Optional[Path] = None,
     validate: bool = True,
-    gdrive_file_id: Optional[str] = None,
 ) -> tuple[str, str, float]:
     """
     Validate, write audio data to WAV file, and create AudioSession database entry.
@@ -198,6 +198,7 @@ async def write_audio_file(
     # Create AudioFile database entry using Beanie model
     audio_file = AudioFile(
         audio_uuid=audio_uuid,
+        source=source,
         audio_path=wav_filename,
         client_id=client_id,
         timestamp=timestamp,
@@ -205,7 +206,6 @@ async def write_audio_file(
         user_email=user_email,
         has_speech=False,  # Will be updated by transcription
         speech_analysis={}, 
-        gdrive_file_id=gdrive_file_id
     )
     await audio_file.insert()
 
diff --git a/backends/advanced/src/advanced_omi_backend/utils/dropbox_audio_utils.py b/backends/advanced/src/advanced_omi_backend/utils/dropbox_audio_utils.py
new file mode 100644
index 00000000..51de2c1b
--- /dev/null
+++ b/backends/advanced/src/advanced_omi_backend/utils/dropbox_audio_utils.py
@@ -0,0 +1,150 @@
+import io
+import tempfile
+from typing import List
+import logging
+from starlette.datastructures import UploadFile as StarletteUploadFile
+import requests
+from advanced_omi_backend.app_config import get_app_config
+
+logger = logging.getLogger(__name__)
+audio_logger = logging.getLogger("audio_processing")
+
+AUDIO_EXTENSIONS = (".wav", ".mp3", ".flac", ".ogg", ".m4a")
+
+class AudioValidationError(Exception):
+    pass
+
+
+async def download_and_wrap_dropbox_file(file_metadata: dict):
+    access_token = get_app_config().dropbox_access_token    
+    if not access_token:
+        raise AudioValidationError("Dropbox access token is missing.")
+
+    file_path = file_metadata["path_lower"]
+    name = file_metadata["name"]
+
+    headers = {
+        "Authorization": f"Bearer {access_token}",
+        "Dropbox-API-Arg": f'{{"path": "{file_path}"}}'
+    }
+
+    response = requests.post(
+        "https://content.dropboxapi.com/2/files/download",
+        headers=headers
+    )
+
+    if response.status_code != 200:
+        raise AudioValidationError(
+            f"Failed to download Dropbox file {name}: {response.text}"
+        )
+
+    content = response.content
+    if not content:
+        raise AudioValidationError(f"Downloaded Dropbox file '{name}' was empty")
+
+    tmp_file = tempfile.SpooledTemporaryFile(max_size=10 * 1024 * 1024)
+    tmp_file.write(content)
+    tmp_file.seek(0)
+
+    upload_file = StarletteUploadFile(filename=name, file=tmp_file)
+
+    original_close = upload_file.close
+
+    def wrapped_close():
+        try:
+            original_close()
+        finally:
+            pass
+
+    upload_file.close = wrapped_close
+    return upload_file
+
+
+async def download_audio_files_from_dropbox(folder_path: str) -> List[StarletteUploadFile]:
+    if not folder_path:
+        raise AudioValidationError("Dropbox folder path is required.")
+
+    access_token = get_app_config().dropbox_access_token
+    if not access_token:
+        raise AudioValidationError("Dropbox access token is missing.")
+
+    try:
+        # -----------------------------------------------
+        # Step 1: List files in folder
+        # -----------------------------------------------
+        list_headers = {
+            "Authorization": f"Bearer {access_token}",
+            "Content-Type": "application/json"
+        }
+
+        list_body = {
+            "path": folder_path,
+            "recursive": False
+        }
+
+        list_res = requests.post(
+            "https://api.dropboxapi.com/2/files/list_folder",
+            headers=list_headers,
+            json=list_body
+        )
+
+        if list_res.status_code != 200:
+            raise AudioValidationError(f"Dropbox API list_folder error: {list_res.text}")
+
+        items = list_res.json().get("entries", [])
+
+        # Filter audio files
+        audio_files_metadata = [
+            f for f in items
+            if f[".tag"] == "file" and f["name"].lower().endswith(AUDIO_EXTENSIONS)
+        ]
+
+        if not audio_files_metadata:
+            raise AudioValidationError("No audio files found in folder.")
+
+        wrapped_files = []
+        skipped_count = 0
+
+        # -----------------------------------------------
+        # Step 2: Download each audio file
+        # -----------------------------------------------
+        for item in audio_files_metadata:
+            dropbox_id = item["id"]  # Dropbox file ID
+
+            # Check if already processed
+            if await is_dropbox_file_already_processed(dropbox_id):
+                audio_logger.info(f"Skipping already processed file: {item['name']}")
+                skipped_count += 1
+                continue
+
+            wrapped_file = await download_and_wrap_dropbox_file(access_token, item)
+
+            # Attach Dropbox file ID
+            setattr(wrapped_file, "dropbox_file_id", dropbox_id)
+
+            wrapped_files.append(wrapped_file)
+
+        if not wrapped_files and skipped_count > 0:
+            raise AudioValidationError(
+                f"All {skipped_count} files in the folder have already been processed."
+            )
+
+        return wrapped_files
+
+    except Exception as e:
+        if isinstance(e, AudioValidationError):
+            raise
+        raise AudioValidationError(f"Dropbox API Error: {e}") from e
+
+
+async def is_dropbox_file_already_processed(dropbox_file_id: str) -> bool:
+    if not dropbox_file_id:
+        return False
+
+    from advanced_omi_backend.models.audio_file import AudioFile
+
+    existing_file = await AudioFile.find_one(
+        AudioFile.dropbox_file_id == dropbox_file_id
+    )
+
+    return existing_file is not None
diff --git a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
index 09c3da17..46b0806d 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/gdrive_audio_utils.py
@@ -90,15 +90,20 @@ async def download_audio_files_from_drive(folder_id: str) -> List[StarletteUploa
             file_id = item["id"] # Get the Google Drive File ID
             
             #  Check if the file is already processed
-            if await is_drive_file_already_processed(file_id):
-                audio_logger.info(f"Skipping already processed file: {item['name']}") # Use your logger
+            existing = await AudioFile.find_one({
+                "audio_uuid": file_id,
+                "source": "gdrive"
+            })
+
+            if existing:
+                audio_logger.info(f"Skipping already processed file: {item['name']}")
                 skipped_count += 1
                 continue
 
             # synchronous call now (but make the parent function async)
             wrapped_file = await download_and_wrap_drive_file(service, item)
             #  Attach the file_id to the UploadFile object for later use
-            wrapped_file.gdrive_file_id = file_id
+            wrapped_file.audio_uuid = file_id
             wrapped_files.append(wrapped_file)
             
         if not wrapped_files and skipped_count > 0:
@@ -112,11 +117,3 @@ async def download_audio_files_from_drive(folder_id: str) -> List[StarletteUploa
         raise AudioValidationError(f"Google Drive API Error: {e}") from e
     
 
-async def is_drive_file_already_processed(gdrive_file_id: str) -> bool:
-    """Check if an AudioFile document already exists for the given GDrive File ID."""
-    if not gdrive_file_id:
-        return False
-    existing_file = await AudioFile.find_one(
-        AudioFile.gdrive_file_id == gdrive_file_id
-    )
-    return existing_file is not None
\ No newline at end of file

From 8e5a6b297ba5ba5e7391b00d3dea66052bb38cab Mon Sep 17 00:00:00 2001
From: 01PrathamS <pratham21btai35@karnavatiuniversity.edu.in>
Date: Mon, 15 Dec 2025 16:47:47 +0530
Subject: [PATCH 10/10] REFACTOR: updated code as per review

---
 .../controllers/audio_controller.py           |   5 +-
 .../utils/dropbox_audio_utils.py              | 150 ------------------
 2 files changed, 4 insertions(+), 151 deletions(-)
 delete mode 100644 backends/advanced/src/advanced_omi_backend/utils/dropbox_audio_utils.py

diff --git a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
index 06492ff2..4810810d 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
@@ -86,6 +86,9 @@ async def upload_and_process_audio_files(
                 # Generate audio UUID and timestamp
                 if source == "gdrive":
                     audio_uuid = getattr(file, "audio_uuid", None)
+                    if not audio_uuid:
+                        audio_logger.error(f"Missing audio_uuid for gdrive file: {file.filename}")
+                        audio_uuid = str(uuid.uuid4())  # fall back to a random ID
                 else: 
                     audio_uuid = str(uuid.uuid4())
                 timestamp = int(time.time() * 1000)
@@ -139,7 +142,7 @@ async def upload_and_process_audio_files(
                 # Use the relative path returned by write_audio_file (already includes folder prefix if applicable)
                 conversation.audio_path = relative_audio_path
                 await conversation.insert()
-                conversation_id = conversation.conversation_id  # Get the auto-gener    ated ID
+                conversation_id = conversation.conversation_id  # Get the auto-generated ID
 
                 audio_logger.info(f"📝 Created conversation {conversation_id} for uploaded file")
 
diff --git a/backends/advanced/src/advanced_omi_backend/utils/dropbox_audio_utils.py b/backends/advanced/src/advanced_omi_backend/utils/dropbox_audio_utils.py
deleted file mode 100644
index 51de2c1b..00000000
--- a/backends/advanced/src/advanced_omi_backend/utils/dropbox_audio_utils.py
+++ /dev/null
@@ -1,150 +0,0 @@
-import io
-import tempfile
-from typing import List
-import logging
-from starlette.datastructures import UploadFile as StarletteUploadFile
-import requests
-from advanced_omi_backend.app_config import get_app_config
-
-logger = logging.getLogger(__name__)
-audio_logger = logging.getLogger("audio_processing")
-
-AUDIO_EXTENSIONS = (".wav", ".mp3", ".flac", ".ogg", ".m4a")
-
-class AudioValidationError(Exception):
-    pass
-
-
-async def download_and_wrap_dropbox_file(file_metadata: dict):
-    access_token = get_app_config().dropbox_access_token    
-    if not access_token:
-        raise AudioValidationError("Dropbox access token is missing.")
-
-    file_path = file_metadata["path_lower"]
-    name = file_metadata["name"]
-
-    headers = {
-        "Authorization": f"Bearer {access_token}",
-        "Dropbox-API-Arg": f'{{"path": "{file_path}"}}'
-    }
-
-    response = requests.post(
-        "https://content.dropboxapi.com/2/files/download",
-        headers=headers
-    )
-
-    if response.status_code != 200:
-        raise AudioValidationError(
-            f"Failed to download Dropbox file {name}: {response.text}"
-        )
-
-    content = response.content
-    if not content:
-        raise AudioValidationError(f"Downloaded Dropbox file '{name}' was empty")
-
-    tmp_file = tempfile.SpooledTemporaryFile(max_size=10 * 1024 * 1024)
-    tmp_file.write(content)
-    tmp_file.seek(0)
-
-    upload_file = StarletteUploadFile(filename=name, file=tmp_file)
-
-    original_close = upload_file.close
-
-    def wrapped_close():
-        try:
-            original_close()
-        finally:
-            pass
-
-    upload_file.close = wrapped_close
-    return upload_file
-
-
-async def download_audio_files_from_dropbox(folder_path: str) -> List[StarletteUploadFile]:
-    if not folder_path:
-        raise AudioValidationError("Dropbox folder path is required.")
-
-    access_token = get_app_config().dropbox_access_token
-    if not access_token:
-        raise AudioValidationError("Dropbox access token is missing.")
-
-    try:
-        # -----------------------------------------------
-        # Step 1: List files in folder
-        # -----------------------------------------------
-        list_headers = {
-            "Authorization": f"Bearer {access_token}",
-            "Content-Type": "application/json"
-        }
-
-        list_body = {
-            "path": folder_path,
-            "recursive": False
-        }
-
-        list_res = requests.post(
-            "https://api.dropboxapi.com/2/files/list_folder",
-            headers=list_headers,
-            json=list_body
-        )
-
-        if list_res.status_code != 200:
-            raise AudioValidationError(f"Dropbox API list_folder error: {list_res.text}")
-
-        items = list_res.json().get("entries", [])
-
-        # Filter audio files
-        audio_files_metadata = [
-            f for f in items
-            if f[".tag"] == "file" and f["name"].lower().endswith(AUDIO_EXTENSIONS)
-        ]
-
-        if not audio_files_metadata:
-            raise AudioValidationError("No audio files found in folder.")
-
-        wrapped_files = []
-        skipped_count = 0
-
-        # -----------------------------------------------
-        # Step 2: Download each audio file
-        # -----------------------------------------------
-        for item in audio_files_metadata:
-            dropbox_id = item["id"]  # Dropbox file ID
-
-            # Check if already processed
-            if await is_dropbox_file_already_processed(dropbox_id):
-                audio_logger.info(f"Skipping already processed file: {item['name']}")
-                skipped_count += 1
-                continue
-
-            wrapped_file = await download_and_wrap_dropbox_file(access_token, item)
-
-            # Attach Dropbox file ID
-            setattr(wrapped_file, "dropbox_file_id", dropbox_id)
-
-            wrapped_files.append(wrapped_file)
-
-        if not wrapped_files and skipped_count > 0:
-            raise AudioValidationError(
-                f"All {skipped_count} files in the folder have already been processed."
-            )
-
-        return wrapped_files
-
-    except Exception as e:
-        if isinstance(e, AudioValidationError):
-            raise
-        raise AudioValidationError(f"Dropbox API Error: {e}") from e
-
-
-async def is_dropbox_file_already_processed(dropbox_file_id: str) -> bool:
-    if not dropbox_file_id:
-        return False
-
-    from advanced_omi_backend.models.audio_file import AudioFile
-
-    existing_file = await AudioFile.find_one(
-        AudioFile.dropbox_file_id == dropbox_file_id
-    )
-
-    return existing_file is not None