Spaces:

Kalp97
/

KalpTranscript

Sleeping

App Files Files Community

Kalp97 committed on Mar 22

Commit

9ea9b32

verified ·

1 Parent(s): 89f48e2

Update app.py

Browse files

Files changed (1) hide show

app.py +109 -16

app.py CHANGED Viewed

@@ -3,6 +3,8 @@ import whisper
 import yt_dlp
 import os
 import tempfile
 models = {}
@@ -38,8 +40,102 @@ def devanagari_to_roman(text):
     return ''.join(result)
 def download_from_url(url):
-    """Download audio from Instagram, YouTube, Twitter, Facebook using yt-dlp"""
     tmp_dir = tempfile.mkdtemp()
     output_path = os.path.join(tmp_dir, 'audio.%(ext)s')
     ydl_opts = {
@@ -47,7 +143,6 @@ def download_from_url(url):
         'outtmpl': output_path,
         'quiet': True,
         'no_warnings': True,
-        'extract_flat': False,
         'postprocessors': [{
             'key': 'FFmpegExtractAudio',
             'preferredcodec': 'mp3',
@@ -55,16 +150,9 @@ def download_from_url(url):
         }],
         'http_headers': {
             'User-Agent': 'Mozilla/5.0 (iPhone; CPU iPhone OS 17_0 like Mac OS X) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/17.0 Mobile/15E148 Safari/604.1',
-            'Accept-Language': 'en-US,en;q=0.9',
-            'Accept': '*/*',
-            'Referer': 'https://www.instagram.com/',
         },
-        'extractor_args': {
-            'instagram': {'api_version': 'v1'},
-        },
-        'socket_timeout': 30,
         'retries': 3,
-        'ignoreerrors': False,
         'geo_bypass': True,
     }
     try:
@@ -73,21 +161,19 @@ def download_from_url(url):
             title = info.get('title', 'video')
     except Exception as e:
         err = str(e)
-        if 'instagram' in err.lower() or '401' in err or '403' in err:
-            raise Exception("Instagram blocked this request. Try again in a few seconds, or make sure the post is public.")
-        elif 'private' in err.lower():
             raise Exception("This account is private. Only public posts can be downloaded.")
         elif 'not found' in err.lower() or '404' in err:
             raise Exception("Video not found. Check the URL and make sure the post still exists.")
         else:
             raise Exception(f"Download failed: {err}")
-    # Find the downloaded mp3
     for f in os.listdir(tmp_dir):
         if f.endswith('.mp3'):
             return os.path.join(tmp_dir, f), title
     raise Exception("Download succeeded but audio file not found.")
 def transcribe(file, model_name, language, show_timestamps, translate):
     if file is None:
         return "Please upload a video or audio file.", ""
@@ -161,7 +247,7 @@ def save_transcript(text):
 def download_video_only(url):
-    """Download video in highest quality and return file path"""
     if not url or not url.strip():
         return None, "Please paste a valid URL."
     url = url.strip()
@@ -169,6 +255,13 @@ def download_video_only(url):
                  'x.com','facebook.com','fb.watch']
     if not any(s in url.lower() for s in supported):
         return None, "Unsupported URL."
     tmp_dir = tempfile.mkdtemp()
     output_path = os.path.join(tmp_dir, 'video.%(ext)s')
     ydl_opts = {
@@ -522,4 +615,4 @@ by Kalpi Edition
     download_btn.click(fn=save_transcript, inputs=plain_output, outputs=download_file)
 if __name__ == "__main__":
-    demo.launch(css=custom_css)

 import yt_dlp
 import os
 import tempfile
+import requests
+import requests
 models = {}
     return ''.join(result)
# SECURITY NOTE(review): a live API key is committed in this file. The
# RAPIDAPI_KEY environment variable (e.g. a deployment secret) now takes
# precedence; the literal is kept only as a backward-compatible fallback and
# should be rotated and then removed from source control.
RAPIDAPI_KEY = (
    os.environ.get("RAPIDAPI_KEY")
    or "47b2f0d88bmsh7842ac99f4b2a3ep12df5djsn6f61065d9692"
)
RAPIDAPI_HOST = "instagram-reels-downloader-api.p.rapidapi.com"


def download_instagram_audio(url):
    """Download an Instagram reel through RapidAPI and extract its audio.

    The RapidAPI ``/download`` endpoint is asked for a direct media URL, the
    media is streamed into a fresh temporary directory as ``ig_video.mp4``,
    and ffmpeg is then run to produce ``audio.mp3`` next to it.

    Args:
        url: Address of the Instagram post/reel to fetch.

    Returns:
        A ``(path, title)`` tuple. ``path`` is the extracted ``audio.mp3``
        when ffmpeg produced a non-empty file, otherwise the downloaded
        ``ig_video.mp4``. ``title`` is always ``'instagram_reel'``.

    Raises:
        ValueError: If ``url`` is empty or whitespace only.
        Exception: If the API answers with a non-200 status or a non-JSON
            body, if no download URL can be found in the response, or if the
            media download itself fails.
    """
    # Local imports keep this block self-contained; both are standard library.
    import shutil
    import subprocess

    # Reject empty input before spending an API call on it.
    if not url or not url.strip():
        raise ValueError("Please paste a valid Instagram URL.")
    url = url.strip()

    headers = {
        "x-rapidapi-key": RAPIDAPI_KEY,
        "x-rapidapi-host": RAPIDAPI_HOST,
        "Content-Type": "application/json"
    }
    resp = requests.get(
        f"https://{RAPIDAPI_HOST}/download",
        headers=headers,
        params={"url": url},
        timeout=30
    )
    if resp.status_code != 200:
        raise Exception(f"RapidAPI error {resp.status_code}: {resp.text[:200]}")
    try:
        data = resp.json()
    except ValueError as exc:
        # A 200 response with an HTML/plain-text body would otherwise surface
        # as an opaque JSON decoding error.
        raise Exception(
            f"RapidAPI returned a non-JSON response: {resp.text[:200]}"
        ) from exc

    # The response schema is not fixed, so probe the known key spellings.
    video_url = None
    if isinstance(data, dict):
        nested = data.get('data')
        if not isinstance(nested, dict):
            # 'data' may be missing, None, or a list; only a dict is probed.
            nested = {}
        video_url = (data.get('url') or data.get('video_url') or
                     data.get('download_url') or
                     nested.get('url') or nested.get('video_url'))
    elif isinstance(data, list) and data and isinstance(data[0], dict):
        item = data[0]
        video_url = item.get('url') or item.get('video_url') or item.get('download_url')
    if not video_url:
        raise Exception(f"No download URL in response: {str(data)[:300]}")

    tmp_dir = tempfile.mkdtemp()
    video_path = os.path.join(tmp_dir, 'ig_video.mp4')
    audio_path = os.path.join(tmp_dir, 'audio.mp3')
    try:
        # The context manager releases the streamed connection even on error.
        with requests.get(video_url, timeout=60, stream=True,
                          headers={"User-Agent": "Mozilla/5.0"}) as vid_resp:
            if vid_resp.status_code != 200:
                # Without this check an error page would be saved as "video".
                raise Exception(
                    f"Video download failed with HTTP {vid_resp.status_code}"
                )
            with open(video_path, 'wb') as f:
                for chunk in vid_resp.iter_content(chunk_size=8192):
                    f.write(chunk)
    except Exception:
        # Do not leave a half-written temp directory behind on failure.
        shutil.rmtree(tmp_dir, ignore_errors=True)
        raise

    # Argument list instead of a shell string: no quoting or injection
    # concerns. Global options (-y, -loglevel) go first as ffmpeg expects.
    try:
        subprocess.run(
            ['ffmpeg', '-y', '-loglevel', 'quiet', '-i', video_path,
             '-q:a', '0', '-map', 'a', audio_path],
            check=False,
        )
    except OSError:
        # ffmpeg is not installed or not executable: keep the best-effort
        # behaviour and fall back to returning the video file below.
        pass

    if os.path.exists(audio_path) and os.path.getsize(audio_path) > 0:
        return audio_path, 'instagram_reel'
    return video_path, 'instagram_reel'
# SECURITY NOTE(review): a live API key is committed in this file. The
# RAPIDAPI_KEY environment variable (e.g. a deployment secret) now takes
# precedence; the literal is kept only as a backward-compatible fallback and
# should be rotated and then removed from source control.
RAPIDAPI_KEY = (
    os.environ.get("RAPIDAPI_KEY")
    or "47b2f0d88bmsh7842ac99f4b2a3ep12df5djsn6f61065d9692"
)
RAPIDAPI_HOST = "instagram-reels-downloader-api.p.rapidapi.com"


def download_instagram_via_rapidapi(url):
    """Download an Instagram reel's video file through RapidAPI.

    The RapidAPI ``/download`` endpoint is asked for a direct media URL and
    the media is streamed into a fresh temporary directory as
    ``instagram.mp4``.

    Args:
        url: Address of the Instagram post/reel to fetch.

    Returns:
        A ``(path, title)`` tuple: the path of the saved ``instagram.mp4``
        and the ``title`` field of the API response, or
        ``'Instagram video'`` when the response carries no usable title.

    Raises:
        ValueError: If ``url`` is empty or whitespace only.
        Exception: If the API answers with a non-200 status or a non-JSON
            body, if no video URL can be found in the response, or if the
            media download itself fails.
    """
    # Local import keeps this block self-contained; shutil is standard library.
    import shutil

    # Reject empty input before spending an API call on it.
    if not url or not url.strip():
        raise ValueError("Please paste a valid Instagram URL.")
    url = url.strip()

    headers = {
        "x-rapidapi-key": RAPIDAPI_KEY,
        "x-rapidapi-host": RAPIDAPI_HOST,
        "Content-Type": "application/json"
    }
    resp = requests.get(
        f"https://{RAPIDAPI_HOST}/download",
        headers=headers,
        params={"url": url},
        timeout=30
    )
    if resp.status_code != 200:
        raise Exception(f"RapidAPI error {resp.status_code}: {resp.text[:200]}")
    try:
        data = resp.json()
    except ValueError as exc:
        # A 200 response with an HTML/plain-text body would otherwise surface
        # as an opaque JSON decoding error.
        raise Exception(
            f"RapidAPI returned a non-JSON response: {resp.text[:200]}"
        ) from exc

    # The response schema is not fixed, so probe the known key spellings,
    # first at the top level and then inside a nested 'data' list or dict.
    video_url = None
    if isinstance(data, dict):
        video_url = (data.get('url') or data.get('download_url') or
                     data.get('video_url') or data.get('link'))
        if not video_url and data.get('data'):
            nested = data['data']
            if isinstance(nested, list) and nested:
                # Only the first entry is inspected.
                nested = nested[0]
            if isinstance(nested, dict):
                video_url = nested.get('url') or nested.get('download_url')
    if not video_url:
        raise Exception(f"No video URL in response: {str(data)[:300]}")

    tmp_dir = tempfile.mkdtemp()
    tmp_path = os.path.join(tmp_dir, 'instagram.mp4')
    try:
        # The context manager releases the streamed connection even on error.
        with requests.get(video_url, timeout=60, stream=True) as video_resp:
            if video_resp.status_code != 200:
                # Without this check an error page would be saved as "video".
                raise Exception(
                    f"Video download failed with HTTP {video_resp.status_code}"
                )
            with open(tmp_path, 'wb') as f:
                for chunk in video_resp.iter_content(chunk_size=8192):
                    f.write(chunk)
    except Exception:
        # Do not leave a half-written temp directory behind on failure.
        shutil.rmtree(tmp_dir, ignore_errors=True)
        raise

    # `data` is a dict here: video_url is only ever set in the dict branch.
    # `or` also covers an explicit null/empty title in the response.
    return tmp_path, data.get('title') or 'Instagram video'
 def download_from_url(url):
+    """Instagram → RapidAPI, everything else → yt-dlp"""
+    if 'instagram.com' in url.lower():
+        return download_instagram_audio(url)
     tmp_dir = tempfile.mkdtemp()
     output_path = os.path.join(tmp_dir, 'audio.%(ext)s')
     ydl_opts = {
         'outtmpl': output_path,
         'quiet': True,
         'no_warnings': True,
         'postprocessors': [{
             'key': 'FFmpegExtractAudio',
             'preferredcodec': 'mp3',
         }],
         'http_headers': {
             'User-Agent': 'Mozilla/5.0 (iPhone; CPU iPhone OS 17_0 like Mac OS X) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/17.0 Mobile/15E148 Safari/604.1',
         },
+        'socket_timeout': 60,
         'retries': 3,
         'geo_bypass': True,
     }
     try:
             title = info.get('title', 'video')
     except Exception as e:
         err = str(e)
+        if 'private' in err.lower():
             raise Exception("This account is private. Only public posts can be downloaded.")
         elif 'not found' in err.lower() or '404' in err:
             raise Exception("Video not found. Check the URL and make sure the post still exists.")
         else:
             raise Exception(f"Download failed: {err}")
     for f in os.listdir(tmp_dir):
         if f.endswith('.mp3'):
             return os.path.join(tmp_dir, f), title
     raise Exception("Download succeeded but audio file not found.")
 def transcribe(file, model_name, language, show_timestamps, translate):
     if file is None:
         return "Please upload a video or audio file.", ""
 def download_video_only(url):
+    """Download video — uses RapidAPI for Instagram, yt-dlp for others"""
     if not url or not url.strip():
         return None, "Please paste a valid URL."
     url = url.strip()
                  'x.com','facebook.com','fb.watch']
     if not any(s in url.lower() for s in supported):
         return None, "Unsupported URL."
+    # Use RapidAPI for Instagram
+    if 'instagram.com' in url.lower():
+        try:
+            tmp_path, title = download_instagram_via_rapidapi(url)
+            return tmp_path, title
+        except Exception as e:
+            return None, str(e)
     tmp_dir = tempfile.mkdtemp()
     output_path = os.path.join(tmp_dir, 'video.%(ext)s')
     ydl_opts = {
     download_btn.click(fn=save_transcript, inputs=plain_output, outputs=download_file)
 if __name__ == "__main__":
+    demo.launch(css=custom_css)