1
0
mirror of https://github.com/mxpv/podsync.git synced 2024-05-11 05:55:04 +00:00
mxpv-podsync/cmd/resolver/function.py
2019-04-14 18:16:25 -07:00

191 lines
5.2 KiB
Python

import os
import youtube_dl
import boto3
from datetime import datetime, time
from dateutil.relativedelta import relativedelta
# Maximum number of resolve requests per feed per day that `download` allows
# for feeds whose feature level is 0; above it QuotaExceeded is raised.
ANONYMOUS_FEED_REQUESTS_LIMIT = 1000
class InvalidUsage(Exception):
    """Raised when a request names an invalid feed id, video id, feed or URL."""
class QuotaExceeded(Exception):
    """Raised when a feed has gone over its daily resolve request limit."""
# DynamoDB handles. Table names may be overridden through environment
# variables; otherwise the defaults 'Feeds' and 'ResolveCounters' are used.
dynamodb = boto3.resource('dynamodb')
feeds_table = dynamodb.Table(
    os.environ.get('RESOLVER_DYNAMO_FEEDS_TABLE', 'Feeds')
)
counter_table = dynamodb.Table(
    os.environ.get('RESOLVER_DYNAMO_RESOLVE_COUNTERS_TABLE', 'ResolveCounters')
)

# Options handed to youtube_dl.YoutubeDL by `_resolve`.
# NOTE(review): 'nocheckcertificate' looks like it turns off TLS certificate
# verification -- confirm that this is intentional.
opts = {
    'quiet': True,
    'no_warnings': True,
    'forceurl': True,
    'simulate': True,
    'skip_download': True,
    'call_home': False,
    'nocheckcertificate': True,
}

# Page URL template per provider; '{}' is filled in with the video id.
url_formats = {
    'youtube': 'https://youtube.com/watch?v={}',
    'vimeo': 'https://vimeo.com/{}',
}
def handler(event, context):
    """Resolve the redirect URL for the feed/video named in ``event``.

    Reads the ``feed_id`` and ``video_id`` keys from ``event`` and hands them
    to ``download``. ``context`` is accepted but not used.

    Returns:
        A dict with the single key ``redirect_url``.

    Raises:
        KeyError: if ``event`` lacks ``feed_id`` or ``video_id``.
    """
    feed_id, video_id = event['feed_id'], event['video_id']
    return {'redirect_url': download(feed_id, video_id)}
def download(feed_id, video_id):
    """Resolve the direct media URL for ``video_id`` within feed ``feed_id``.

    Loads the feed metadata, increments the feed's daily resolve counter,
    enforces the request limit for feeds with feature level 0, builds the
    provider page URL and resolves it through ``_resolve``.

    Args:
        feed_id: Hash id of the feed.
        video_id: Video id, optionally followed by a file extension
            (the extension is stripped).

    Returns:
        The URL chosen by ``_resolve``.

    Raises:
        InvalidUsage: if the feed id or video id is empty, or the feed's
            provider has no entry in ``url_formats``.
        QuotaExceeded: if a feed with feature level 0 exceeded
            ``ANONYMOUS_FEED_REQUESTS_LIMIT`` requests for the current day.
    """
    if not feed_id:
        raise InvalidUsage('Invalid feed id')

    # Remove extension and check if video id is ok. `or ''` makes a None id
    # fail the check below instead of crashing inside os.path.splitext.
    video_id = os.path.splitext(video_id or '')[0]
    if not video_id:
        raise InvalidUsage('Invalid video id')

    # Query feed metadata info from DynamoDB
    item = _get_metadata(feed_id)

    # Update resolve requests counter (the request is counted before the
    # quota check, so rejected requests are counted too)
    count = _update_resolve_counter(feed_id)
    level = int(item['featurelevel'])
    if count > ANONYMOUS_FEED_REQUESTS_LIMIT and level == 0:
        raise QuotaExceeded('Too many requests. Daily limit is %d. Consider upgrading account to get unlimited '
                            'access' % ANONYMOUS_FEED_REQUESTS_LIMIT)

    # Build URL. Use .get() so an unknown or missing provider reaches the
    # InvalidUsage check instead of raising KeyError.
    tpl = url_formats.get(item.get('provider'))
    if not tpl:
        raise InvalidUsage('Invalid feed')

    return _resolve(tpl.format(video_id), item)
def _get_metadata(feed_id):
    """Fetch the metadata of feed ``feed_id`` from the feeds table.

    Only the ``Provider``, ``Format``, ``Quality`` and ``FeatureLevel``
    attributes are requested, looked up by the ``HashID`` key.

    Returns:
        A dict of the returned attributes with lower-cased keys
        (e.g. ``provider``, ``featurelevel``).

    Raises:
        InvalidUsage: if the table holds no item for ``feed_id``.
    """
    response = feeds_table.get_item(
        Key={'HashID': feed_id},
        ProjectionExpression='#P,#F,#Q,#L',
        ExpressionAttributeNames={
            '#P': 'Provider',
            '#F': 'Format',
            '#Q': 'Quality',
            '#L': 'FeatureLevel',
        },
    )

    # The response carries no 'Item' entry when nothing matches the key;
    # report that as a usage error rather than a bare KeyError.
    item = response.get('Item')
    if item is None:
        raise InvalidUsage('Feed not found')

    # Make dict keys lowercase
    return {k.lower(): v for k, v in item.items()}
def _update_resolve_counter(feed_id):
if not feed_id:
return
now = datetime.utcnow()
day = now.strftime('%Y%m%d')
expires = now + relativedelta(months=3)
response = counter_table.update_item(
Key={
'FeedID': feed_id,
'Day': int(day),
},
UpdateExpression='ADD #count :one SET #exp = if_not_exists(#exp, :ttl)',
ExpressionAttributeNames={
'#count': 'Count',
'#exp': 'Expires',
},
ExpressionAttributeValues={
':one': 1,
':ttl': int(expires.timestamp()),
},
ReturnValues='UPDATED_NEW',
)
attrs = response['Attributes']
return attrs['Count']
def _resolve(url, metadata):
    """Extract media info for ``url`` and pick the URL matching the feed settings.

    Args:
        url: Provider page URL of the video.
        metadata: Feed metadata dict; its ``provider`` entry selects the
            chooser (``youtube`` or ``vimeo``) and the whole dict is passed
            on to that chooser.

    Returns:
        The URL returned by the provider-specific chooser.

    Raises:
        InvalidUsage: if ``url`` is empty.
        ValueError: if the provider is neither ``youtube`` nor ``vimeo``.
        Exception: anything raised during extraction or selection is printed
            and re-raised unchanged.
    """
    if not url:
        raise InvalidUsage('Invalid URL')

    print('Resolving %s' % url)

    try:
        provider = metadata['provider']
        with youtube_dl.YoutubeDL(opts) as ytdl:
            info = ytdl.extract_info(url, download=False)
            if provider == 'vimeo':
                return _vimeo_choose_url(info, metadata)
            if provider != 'youtube':
                raise ValueError('undefined provider')
            return _yt_choose_url(ytdl, info, metadata)
    except Exception as err:
        # Log the failure, then let the original exception propagate.
        print(err)
        raise
def _yt_choose_url(ytdl, info, metadata):
is_video = metadata['format'] == 'video'
is_high_quality = metadata['quality'] == 'high'
if not is_video:
fmt = 'bestaudio' if is_high_quality else 'worstaudio'
selector = ytdl.build_format_selector(fmt)
try:
selected = next(selector(info))
if 'fragment_base_url' in selected:
return selected['fragment_base_url']
except KeyError:
pass
# Filter formats by file extension
ext = 'mp4' if is_video else 'm4a'
fmt_list = [x for x in info['formats'] if x['ext'] == ext and 'acodec' in x and x['acodec'] != 'none']
if not len(fmt_list):
return info['url']
# Sort list by field (width for videos, file size for audio)
sort_field = 'width' if is_video else 'filesize'
# Sometime 'filesize' field can be None
if not all(x[sort_field] is not None for x in fmt_list):
sort_field = 'format_id'
ordered = sorted(fmt_list, key=lambda x: x[sort_field], reverse=True)
# Choose an item depending on quality, better at the beginning
item = ordered[0] if is_high_quality else ordered[-1]
return item['url']
def _vimeo_choose_url(info, metadata):
# Query formats with 'extension' = mp4 and 'format_id' = http-1080p/http-720p/../http-360p
fmt_list = [x for x in info['formats'] if x['ext'] == 'mp4' and x['format_id'].startswith('http-')]
ordered = sorted(fmt_list, key=lambda x: x['width'], reverse=True)
is_high_quality = metadata['quality'] == 'high'
item = ordered[0] if is_high_quality else ordered[-1]
return item['url']