diff --git a/youtube_dl/extractor/truth.py b/youtube_dl/extractor/truth.py index 0f5b044f0..b48273779 100644 --- a/youtube_dl/extractor/truth.py +++ b/youtube_dl/extractor/truth.py @@ -3,38 +3,43 @@ from __future__ import unicode_literals from .common import InfoExtractor -from ..utils import clean_html, int_or_none, unified_timestamp +from ..utils import ( + clean_html, + int_or_none, + unified_timestamp, + strip_or_none +) class TruthIE(InfoExtractor): """Extract videos from posts on Donald Trump's truthsocial.com.""" - _VALID_URL = r"https://truthsocial\.com/@[^/]+/posts/(?P[0-9]+)" + _VALID_URL = r'https://truthsocial\.com/@[^/]+/posts/(?P[0-9]+)' _TESTS = [ { - "url": "https://truthsocial.com/@realDonaldTrump/posts/108779000807761862", - "md5": "4a5fb1470c192e493d9efd6f19e514d3", - "info_dict": { - "id": "108779000807761862", - "ext": "qt", - "title": "Untitled", - "timestamp": 1659835827, - "upload_date": "20220807", - "uploader": "Donald J. Trump", - "uploader_id": "realDonaldTrump", + 'url': 'https://truthsocial.com/@realDonaldTrump/posts/108779000807761862', + 'md5': '4a5fb1470c192e493d9efd6f19e514d3', + 'info_dict': { + 'id': '108779000807761862', + 'ext': 'qt', + 'title': '0d8691160c73d663', + 'timestamp': 1659835827, + 'upload_date': '20220807', + 'uploader': 'Donald J. Trump', + 'uploader_id': 'realDonaldTrump', }, }, { - "url": "https://truthsocial.com/@ProjectVeritasAction/posts/108618228543962049", - "md5": "fd47ba68933f9dce27accc52275be9c3", - "info_dict": { - "id": "108618228543962049", - "ext": "mp4", - "title": "RETRACTO #368: Utah NPR Affiliate RETRACTS False Claim Live On Air Following Veritas' Reporting on Curtis Campaign “Nothing I ever do will suffice for these people. They are engaged in conspiracy theories. They are doing precisely the thing they project that I do. Which is they don’t believe in facts, they don’t believe in logic, and they don’t believe in rationality.” - James O’Keefe", - "timestamp": 1657382637, - "upload_date": "20220709", - "uploader": "Project Veritas Action", - "uploader_id": "ProjectVeritasAction", + 'url': 'https://truthsocial.com/@ProjectVeritasAction/posts/108618228543962049', + 'md5': 'fd47ba68933f9dce27accc52275be9c3', + 'info_dict': { + 'id': '108618228543962049', + 'ext': 'mp4', + 'title': """RETRACTO #368: Utah NPR Affiliate RETRACTS False Claim Live On Air Following Veritas' Reporting on Curtis Campaign \n“Nothing I ever do will suffice for these people. They are engaged in conspiracy theories. They are doing precisely the thing they project that I do. Which is they don’t believe in facts, they don’t believe in logic, and they don’t believe in rationality.” - James O’Keefe""", + 'timestamp': 1657382637, + 'upload_date': '20220709', + 'uploader': 'Project Veritas Action', + 'uploader_id': 'ProjectVeritasAction', }, }, ] @@ -44,36 +49,33 @@ class TruthIE(InfoExtractor): video_id = self._match_id(url) # Get data from API - api_url = "https://truthsocial.com/api/v1/statuses/" + video_id + api_url = 'https://truthsocial.com/api/v1/statuses/' + video_id status = self._download_json(api_url, video_id) # Pull out video - attachments = status["media_attachments"] - video = attachments[0] - url = video["url"] + url = status['media_attachments'][0]['url'] # Pull out metadata - title = clean_html(status.get("content")).replace("\n", "") or "Untitled" - account = status.get("account") or {} - timestamp = unified_timestamp(status.get("created_at")) - uploader = account.get("display_name") - uploader_id = account.get("username") - uploader_url = ( - "https://truthsocial.com/@" + uploader_id if uploader_id else None - ) - repost_count = int_or_none(status.get("reblogs_count")) - like_count = int_or_none(status.get("favourites_count")) - comment_count = int_or_none(status.get("replies_count")) + title = strip_or_none(clean_html(status.get('content'))) or self._generic_title(url) + timestamp = unified_timestamp(status.get('created_at')) + account = status.get('account') or {} + uploader = strip_or_none(account.get('display_name')) + uploader_id = strip_or_none(account.get('username')) + uploader_url = ('https://truthsocial.com/@' + uploader_id) if uploader_id else None + repost_count = int_or_none(status.get('reblogs_count')) + like_count = int_or_none(status.get('favourites_count')) + comment_count = int_or_none(status.get('replies_count')) + # Return the stuff return { - "id": video_id, - "url": url, - "title": title, - "timestamp": timestamp, - "uploader": uploader, - "uploader_id": uploader_id, - "uploader_url": uploader_url, - "repost_count": repost_count, - "like_count": like_count, - "comment_count": comment_count, + 'id': video_id, + 'url': url, + 'title': title, + 'timestamp': timestamp, + 'uploader': uploader, + 'uploader_id': uploader_id, + 'uploader_url': uploader_url, + 'repost_count': repost_count, + 'like_count': like_count, + 'comment_count': comment_count, }