Files
polyphemus/polyphemus/api.py

372 lines
9.7 KiB
Python

# -*- coding: UTF-8 -*-
"""Functions to request and process information from Odysee APIs
"""
#+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++#
import json
from urllib.parse import quote
import requests
#+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++#
#TODO Figure out how to reverse-engineer this token instead of hard-coding it
# Sent as the ``auth_token`` field by `get_subscribers`, `get_views` and
# `get_video_reactions`.
# NOTE(review): this is a credential committed to source; presumably it should
# be loaded from configuration or the environment -- confirm.
AUTH_TOKEN = 'BseGAiye641UqUsv4g31ZcUCRiLasv3U'
# API endpoints for Odysee data
#-----------------------------------------------------------------------------#
# JSON-RPC proxy used for the ``resolve``, ``claim_search`` and ``get`` methods
BACKEND_API_URL = 'https://api.na-backend.odysee.com/api/v1/proxy'
# Queried by `get_subscribers`
SUBSCRIBER_API_URL = 'https://api.odysee.com/subscription/sub_count'
# Queried by `get_views`
VIEW_API_URL = 'https://api.odysee.com/file/view_count'
# Queried by `get_video_reactions`
REACTION_API_URL = 'https://api.odysee.com/reaction/list'
# JSON-RPC endpoint used for the ``comment.List`` and ``reaction.List`` methods
COMMENT_API_URL = 'https://comments.odysee.com/api/v2'
# Queried by `get_recommended`
RECOMMENDATION_API_URL = 'https://recsys.odysee.com/search'
#+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++#
def make_request(request, kwargs):
    """Send an HTTP request, retrying until a 200 response is received.

    The request is attempted once and then retried up to five more times.
    Both non-200 responses and transport-level failures (connection errors,
    timeouts, ...) count as failed attempts.

    Parameters
    ----------
    request: callable
        Either ``requests.get`` or ``requests.post``.
    kwargs: dict
        Keyword arguments forwarded to ``request``. The dict is not modified.
        If it has no ``'timeout'`` entry a default of 30 seconds is used so
        that a stalled connection cannot block forever.

    Returns
    -------
    response: requests.Response
        The first response whose status code is 200.

    Raises
    ------
    ValueError
        If ``request`` is not ``requests.get``/``requests.post``, or if the
        final attempt still returned a non-200 status code.
    requests.exceptions.RequestException
        If the final attempt failed with a transport-level error; the
        original exception is re-raised unchanged.
    """
    if request not in [requests.get, requests.post]:
        msg = f'`request` argument must be either `requests.get` or `requests.post`, not {type(request)}'
        raise ValueError(msg)
    max_retries = 5
    # Work on a copy so that the default timeout never leaks into the
    # caller's dict.
    request_kwargs = dict(kwargs)
    request_kwargs.setdefault('timeout', 30)
    for attempt in range(max_retries + 1):
        try:
            response = request(**request_kwargs)
        except requests.exceptions.RequestException:
            # Transient network failures are retried like bad status codes;
            # once the retries are used up the original error propagates.
            if attempt == max_retries:
                raise
            continue
        if response.status_code == 200:
            return response
    msg = f'Maximum number of retries reached for request {request} with kwargs {kwargs}'
    raise ValueError(msg)
#+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++#
def get_channel_info(channel_name):
    """Resolve a channel by name and summarise the returned claim.

    Parameters
    ----------
    channel_name: str
        Channel name without the leading ``@``; it is resolved as
        ``lbry://@<channel_name>``.

    Returns
    -------
    info: dict
        Dictionary with the keys ``'channel_id'``, ``'title'``,
        ``'created'``, ``'description'``, ``'cover_image'``,
        ``'thumbnail_image'`` and ``'raw'`` (the unparsed response text).
        Optional fields missing from the response are returned as ``None``.
    """
    lbry_url = f'lbry://@{channel_name}'
    payload = {
        "jsonrpc":"2.0",
        "method":"resolve",
        "params":{"urls":[lbry_url]}}
    response = make_request(
        requests.post,
        {'url': BACKEND_API_URL, 'json': payload})
    claim = json.loads(response.text)['result'][lbry_url]
    # Mandatory fields are read in the same order as before so that a
    # malformed response fails on the same key.
    channel_id = claim['claim_id']
    value = claim['value']
    created = claim['timestamp']
    return {
        'channel_id' : channel_id,
        'title' : value.get('title'),
        'created': created,
        'description': value.get('description'),
        'cover_image': value.get('cover',{}).get('url'),
        'thumbnail_image': value.get('thumbnail',{}).get('url'),
        'raw' : response.text}
#+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++#
def get_subscribers(claim_id):
    """Query the subscriber-count endpoint for a channel.

    Parameters
    ----------
    claim_id: str
        Claim ID of the channel.

    Returns
    -------
    subscribers
        First element of the ``'data'`` field of the API response.
    """
    form_fields = {'auth_token': AUTH_TOKEN, 'claim_id': claim_id }
    response = make_request(
        requests.post,
        {'url': SUBSCRIBER_API_URL, 'data': form_fields})
    return json.loads(response.text)['data'][0]
#+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++#
def get_all_videos(channel_id):
    """Collect every claim returned by ``claim_search`` for a channel ID.

    Pages of 30 items are requested, starting at page 1, until a page comes
    back empty.

    Parameters
    ----------
    channel_id: str
        Claim ID of the channel whose claims are listed.

    Returns
    -------
    all_videos: list<dict>
        List of dictionaries, with each dict corresponding to one item of
        the ``claim_search`` JSON response.
    """
    collected = []
    page_number = 1
    while True:
        payload = {
            "jsonrpc":"2.0",
            "method":"claim_search",
            "params":{
                "page_size":30,
                "page":page_number,
                "order_by":["release_time"],
                "channel_ids":[channel_id]}}
        response = make_request(
            requests.post,
            {'url': BACKEND_API_URL, 'json': payload})
        page_items = json.loads(response.text)['result']['items']
        # An empty page marks the end of the listing.
        if not page_items:
            return collected
        collected.extend(page_items)
        page_number += 1
#+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++#
def get_views(claim_id):
    """Query the view-count endpoint for a claim.

    Parameters
    ----------
    claim_id: str
        Claim ID of the video.

    Returns
    -------
    views
        First element of the ``'data'`` field of the API response.
    """
    query = {'auth_token': AUTH_TOKEN, 'claim_id': claim_id }
    response = make_request(
        requests.get,
        {'url': VIEW_API_URL, 'params': query})
    payload = json.loads(response.text)
    return payload['data'][0]
#+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++#
def get_video_reactions(claim_id):
    """Fetch the like and dislike counts recorded for a claim.

    Parameters
    ----------
    claim_id: str
        Claim ID of the video.

    Returns
    -------
    (like, dislike): tuple
        The ``'like'`` and ``'dislike'`` entries found under
        ``others_reactions`` for this claim, or ``(None, None)`` when the
        response's ``'success'`` field is falsy.
    """
    form_fields = {'auth_token': AUTH_TOKEN, 'claim_ids': claim_id }
    response = make_request(
        requests.post,
        {'url': REACTION_API_URL, 'data': form_fields})
    body = json.loads(response.text)
    if not body['success']:
        return None, None
    counts = body['data']['others_reactions'][claim_id]
    return counts['like'], counts['dislike']
#+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++#
def get_all_comments(claim_id):
    """Collect every comment of a video, annotated with reaction counts.

    Pages of 10 comments are requested through ``comment.List``, starting at
    page 1, until a response no longer contains an ``'items'`` entry. Each
    page is passed through `append_comment_reactions` before being stored.

    Parameters
    ----------
    claim_id: str
        Claim ID for the video whose comments are to be scraped
        e.g. ``'84d2a91e910bee523af5422439a639f677b9c78f'``

    Returns
    -------
    all_comments: list<dict>
        List of dictionaries, with each dict corresponding to a JSON response
        containing data about a single comment for the specified video.
    """
    gathered = []
    page_number = 1
    while True:
        payload = {
            "jsonrpc":"2.0",
            "id":1,
            "method":"comment.List",
            "params":{
                "page":page_number,
                "claim_id":claim_id,
                "page_size":10,
                "top_level":False,
                "sort_by":3}}
        response = make_request(
            requests.post,
            {'url': COMMENT_API_URL, 'json': payload})
        listing = json.loads(response.text)['result']
        # A response without 'items' marks the end of the comment listing.
        if 'items' not in listing:
            return gathered
        gathered.extend(append_comment_reactions(comments = listing['items']))
        page_number += 1
#+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++#
def append_comment_reactions(comments):
    """Get reaction data for each comment and insert ``'likes'`` and
    ``'dislikes'`` keys into the dict for each comment.

    A single ``reaction.List`` request is made for all comments at once. The
    dictionaries are updated in place and the same list is returned.

    Parameters
    ----------
    comments: list<dict>
        List of dictionaries, with each dict corresponding to a JSON response
        containing data about a single comment for the specified video. Each
        dict must have a ``'comment_id'`` key.

    Returns
    -------
    comments: list<dict>
        The input list, where every dict has gained the ``'likes'`` and
        ``'dislikes'`` fields taken from the ``others_reactions`` entry of
        the response for that comment. An empty input is returned unchanged
        without contacting the API.
    """
    # Nothing to look up: avoid sending a request with an empty ID list.
    if not comments:
        return comments
    comment_ids = ','.join(c['comment_id'] for c in comments)
    json_data = {
        "jsonrpc":"2.0",
        "id":1,
        "method":"reaction.List",
        "params":{
            "comment_ids":comment_ids}}
    response = make_request(
        request = requests.post,
        kwargs = {
            'url' : COMMENT_API_URL,
            'json': json_data})
    result = json.loads(response.text)
    reactions = result['result']['others_reactions']
    for comment in comments:
        counts = reactions[comment['comment_id']]
        comment['likes'] = counts['like']
        comment['dislikes'] = counts['dislike']
    return comments
#+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++#
def get_recommended(title, claim_id):
    """Get resolved claim information for the videos recommended for a video.

    The recommendation endpoint is queried for up to 20 results, each result
    name is resolved through `name_to_video_info`, and only resolved claims
    whose ``'value_type'`` is ``'stream'`` and whose ``'value'`` contains a
    ``'video'`` or ``'audio'`` key are kept.

    Parameters
    ----------
    title: str
        Title of the video, used as the search string.
    claim_id: str
        Claim ID of the video, sent as ``related_to``.

    Returns
    -------
    recommended_video_info: list<dict>
        Resolved claim dictionaries for the recommended streams.
    """
    # NOTE(review): `requests` URL-encodes `params` values itself, so quoting
    # here looks like it double-encodes the title -- confirm what the API
    # expects before changing it.
    name = quote(title)
    params = {
        's':name,
        'size':'20',
        'from':'0',
        'related_to':claim_id}
    response = make_request(
        request = requests.get,
        kwargs = {
            'url' : RECOMMENDATION_API_URL,
            'params': params})
    result = json.loads(response.text)
    resolved = [name_to_video_info(r['name']) for r in result]
    # Logical `and` (rather than bitwise `&`) so the content check is only
    # evaluated for stream claims.
    recommended_video_info = [
        vi for vi in resolved
        if vi.get('value_type') == 'stream'
        and any(key in vi.get('value', []) for key in ('video', 'audio'))]
    return recommended_video_info
#+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++#
def name_to_video_info(name):
    """Resolve ``lbry://<name>`` and return the entry returned for that URL.

    Parameters
    ----------
    name: str
        Claim name to resolve.

    Returns
    -------
    The value stored under the resolved URL in the ``'result'`` field of the
    ``resolve`` response.
    """
    lbry_url = f"lbry://{name}"
    payload = {
        "jsonrpc":"2.0",
        "method":"resolve",
        "params":{"urls":[lbry_url]}}
    response = make_request(
        requests.post,
        {'url': BACKEND_API_URL, 'json': payload})
    resolved = json.loads(response.text)['result']
    return resolved[lbry_url]
#+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++#
def get_streaming_url(canonical_url):
    """Request a claim through the ``get`` method and return its streaming URL.

    Parameters
    ----------
    canonical_url: str
        URI of the claim, sent as the ``uri`` parameter.

    Returns
    -------
    video_url
        The ``'streaming_url'`` entry of the response's ``'result'`` field,
        or ``None`` when that entry is absent.
    """
    payload = {
        "jsonrpc":"2.0",
        "method":"get",
        "params":{"uri":canonical_url}}
    response = make_request(
        requests.post,
        {'url': BACKEND_API_URL, 'json': payload})
    outcome = json.loads(response.text)['result']
    return outcome.get('streaming_url')
#+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++#