Spaces:

dindizz
/

youtubetonewsstory

Sleeping

dindizz committed on Nov 26, 2024

Commit

394082a

verified ·

1 Parent(s): 3244187

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -28,20 +28,27 @@ def retrieve_transcript(video_url):
     # Parse the player response JSON using json.loads
     player = match.group(1)
-    player = json.loads(player)  # Use json.loads for secure parsing
     # Extract metadata
     metadata = {
-        "title": player["videoDetails"]["title"],
-        "duration": player["videoDetails"]["lengthSeconds"],
-        "author": player["videoDetails"]["author"],
-        "views": player["videoDetails"]["viewCount"],
     }
     # Get the tracks and sort them by priority
     tracks = player.get("captions", {}).get("playerCaptionsTracklistRenderer", {}).get("captionTracks", [])
     if not tracks:
-        return "No captions available for this video."
     # Sort tracks by priority
     tracks.sort(compare_tracks)
@@ -69,11 +76,6 @@ def retrieve_transcript(video_url):
         .replace("\s+", " ")
     )
-    result = {
-        "metadata": metadata,
-        "transcript": parsed_transcript,
-    }
     return f"Title: {metadata['title']}\nAuthor: {metadata['author']}\nViews: {metadata['views']}\nDuration: {metadata['duration']} seconds\n\nTranscript:\n{parsed_transcript}"

     # Parse the player response JSON using json.loads
     player = match.group(1)
+    try:
+        player = json.loads(player)  # Use json.loads for secure parsing
+    except json.JSONDecodeError:
+        return "Error decoding YouTube response. The response format may have changed."
+    # Check if videoDetails exists
+    if "videoDetails" not in player:
+        return "The video details could not be found. The video might be private, restricted, or unavailable."
     # Extract metadata
     metadata = {
+        "title": player["videoDetails"].get("title", "Unknown Title"),
+        "duration": player["videoDetails"].get("lengthSeconds", "Unknown Duration"),
+        "author": player["videoDetails"].get("author", "Unknown Author"),
+        "views": player["videoDetails"].get("viewCount", "Unknown Views"),
     }
     # Get the tracks and sort them by priority
     tracks = player.get("captions", {}).get("playerCaptionsTracklistRenderer", {}).get("captionTracks", [])
     if not tracks:
+        return f"Title: {metadata['title']}\n\nNo captions available for this video."
     # Sort tracks by priority
     tracks.sort(compare_tracks)
         .replace("\s+", " ")
     )
     return f"Title: {metadata['title']}\nAuthor: {metadata['author']}\nViews: {metadata['views']}\nDuration: {metadata['duration']} seconds\n\nTranscript:\n{parsed_transcript}"