2022-08-08 03:14:24 +09:00
# coding: utf-8
from __future__ import unicode_literals
from urllib import parse
from . common import InfoExtractor
2022-08-09 01:45:59 +09:00
from . . utils import (
clean_html ,
strip_or_none ,
unified_timestamp ,
urlencode_postdata ,
)
2022-08-08 03:14:24 +09:00
class ParlerIE ( InfoExtractor ) :
""" Extract videos from posts on Parler. """
2022-08-09 01:46:26 +09:00
_UUID_RE = r ' [0-9a-f] {8} -[0-9a-f] {4} -[0-9a-f] {4} -[0-9a-f] {4} -[0-9a-f] {12} '
_VALID_URL = r ' https://parler \ .com/feed/(?P<id> %s ) ' % ( _UUID_RE , )
2022-08-08 03:14:24 +09:00
_TESTS = [
{
2022-08-09 03:01:58 +09:00
' url ' : ' https://parler.com/feed/df79fdba-07cc-48fe-b085-3293897520d7 ' ,
' md5 ' : ' 16e0f447bf186bb3cf64de5bbbf4d22d ' ,
' info_dict ' : {
' id ' : ' df79fdba-07cc-48fe-b085-3293897520d7 ' ,
' ext ' : ' mp4 ' ,
' title ' : ' Puberty-blocking procedures promoted by the Biden/Harris Admin are child abuse. The FDA has recently confirmed these hormones/drugs have extremely dangerous side effects, like brain swelling and vision loss. ' ,
' timestamp ' : 1659744000 ,
' upload_date ' : ' 20220806 ' ,
' uploader ' : ' Tulsi Gabbard ' ,
' uploader_id ' : ' TulsiGabbard ' ,
2022-08-08 03:14:24 +09:00
} ,
} ,
{
2022-08-09 03:01:58 +09:00
' url ' : ' https://parler.com/feed/a7406eb4-91e5-4793-b5e3-ade57a24e287 ' ,
' md5 ' : ' 11687e2f5bb353682cee338d181422ed ' ,
' info_dict ' : {
' id ' : ' a7406eb4-91e5-4793-b5e3-ade57a24e287 ' ,
' ext ' : ' mp4 ' ,
' title ' : ' This man should run for office ' ,
' timestamp ' : 1659657600 ,
' upload_date ' : ' 20220805 ' ,
' uploader ' : ' Benny Johnson ' ,
' uploader_id ' : ' BennyJohnson ' ,
2022-08-08 03:14:24 +09:00
} ,
} ,
]
def _real_extract ( self , url ) :
video_id = self . _match_id ( url )
# Get data from API
2022-08-09 01:46:46 +09:00
api_url = ' https://parler.com/open-api/ParleyDetailEndpoint.php '
2022-08-08 03:14:24 +09:00
payload = parse . urlencode ( { " uuid " : video_id } ) . encode ( )
status = self . _download_json ( api_url , video_id , data = payload )
# Pull out video
2022-08-09 01:47:08 +09:00
url = status [ ' data ' ] [ 0 ] [ ' primary ' ] [ ' video_data ' ] [ ' videoSrc ' ]
# now we know this exists and is a dict
data = status [ ' data ' ] [ 0 ] [ ' primary ' ]
2022-08-08 03:14:24 +09:00
# Pull out metadata
title = clean_html ( data . get ( " full_body " ) ) . replace ( " \n " , " " )
2022-08-09 03:03:09 +09:00
timestamp = unified_timestamp ( data . get ( ' date_created ' ) )
2022-08-09 03:03:00 +09:00
uploader = strip_or_none ( data . get ( ' name ' ) )
uploader_id = strip_or_none ( data . get ( ' username ' ) )
2022-08-09 03:03:18 +09:00
uploader_url = ( ' https://parler.com/ ' + uploader_id ) if uploader_id else None
2022-08-08 03:14:24 +09:00
# Return the result
return {
2022-08-09 03:04:11 +09:00
' id ' : video_id ,
' url ' : url ,
' title ' : title ,
' timestamp ' : timestamp ,
' uploader ' : uploader ,
' uploader_id ' : uploader_id ,
' uploader_url ' : uploader_url ,
2022-08-08 03:14:24 +09:00
}