NewLeaf/index.py

157 lines
4.7 KiB
Python
Raw Normal View History

import cherrypy
import json
2021-04-03 01:00:05 +00:00
import pathlib
2020-08-07 14:51:32 +00:00
import requests
import yt_dlp
2020-08-13 14:20:11 +00:00
from extractors.video import extract_video
from extractors.channel import extract_channel, extract_channel_videos, extract_channel_latest
from extractors.manifest import extract_manifest
from extractors.search import extract_search
from extractors.suggestions import extract_search_suggestions
from extractors.captions import extract_captions
from extractors.comments import extract_comments
import configuration
2020-10-02 10:40:39 +00:00
@cherrypy.tools.register("before_finalize", priority=60)
def custom_headers():
    """Set ``access-control-allow-origin: *`` on the outgoing response.

    Registered as a CherryPy tool on the ``before_finalize`` hook point, so
    it only runs for paths whose config turns ``tools.custom_headers.on`` on.
    """
    response_headers = cherrypy.response.headers
    response_headers["access-control-allow-origin"] = "*"
2020-08-09 08:38:40 +00:00
2021-02-27 00:09:31 +00:00
class NewLeaf(object):
    """CherryPy application root exposing the HTTP handlers of this server.

    Paths under ``/api/v1/<endpoint>/...`` and ``/api/manifest/dash/id/...``
    are rewritten by ``_cp_dispatch`` onto the exposed methods of this class.
    """

    def _cp_dispatch(self, vpath):
        """Rewrite API-style paths so CherryPy can resolve them on this object.

        ``vpath`` is the list of remaining path components; it is modified in
        place. When a rewrite applies, ``self`` is returned so dispatch
        continues on this object with the shortened path. Otherwise ``vpath``
        is returned unchanged.
        """
        if vpath[:4] == ["api", "manifest", "dash", "id"]:
            vpath[:4] = ["manifest"]
            return self

        # The length guard keeps a bare "/api/v1" request from indexing past
        # the end of vpath when the endpoint name is looked up.
        if vpath[:2] == ["api", "v1"] and len(vpath) > 2:
            # (handler name, minimum, maximum) where the bounds count the
            # path components allowed after the endpoint name.
            endpoints = [
                ("channels", 1, 2),
                ("videos", 1, 1),
                ("search", 0, 1),
                ("captions", 1, 1),
                ("comments", 1, 1),
            ]
            for name, at_least, at_most in endpoints:
                if vpath[2] == name and at_least + 3 <= len(vpath) <= at_most + 3:
                    vpath[:3] = [name]
                    return self

        return vpath

    @cherrypy.expose
    @cherrypy.tools.json_out()
    def videos(self, id, **kwargs):
        """Return the result of ``extract_video(id)`` as JSON."""
        return extract_video(id)

    @cherrypy.expose
    @cherrypy.tools.encode()
    def manifest(self, id, **kwargs):
        """Return the manifest produced by ``extract_manifest(id)``.

        The content-type depends on what the extractor returned:
        a dict is serialised as JSON, a ``requests`` response is passed
        through with its own content-type, and anything else is served as
        ``application/dash+xml``.
        """
        result = extract_manifest(id)
        if isinstance(result, dict):
            cherrypy.response.headers["content-type"] = "application/json"
            return bytes(json.dumps(result), "utf8")
        if isinstance(result, requests.models.Response):
            cherrypy.response.headers["content-type"] = result.headers["content-type"]
            return result
        cherrypy.response.headers["content-type"] = "application/dash+xml"
        return result

    @cherrypy.expose
    @cherrypy.tools.json_out()
    def channels(self, *suffix, second__path="channel", **kwargs):
        """Return channel data, optionally restricted to one part.

        ``suffix`` holds the path components after the endpoint name: either
        ``(ucid,)`` or a ``ucid`` together with one of the part keywords
        ``videos`` / ``latest`` / ``playlists``, in either order.
        ``second__path`` must be ``channel``, ``c`` or ``user`` (only
        ``channel`` when the part is ``latest``).

        Returns the extractor result, an empty list for ``playlists``, or an
        error dict with ``error`` and ``identifier`` keys.

        Raises ``cherrypy.NotFound`` when no path component was given.
        """
        ucid = ""
        part = ""
        possible_parts = ("videos", "latest", "playlists")

        if not suffix:
            # Nothing identifies a channel; previously this crashed with an
            # IndexError and surfaced as a 500.
            raise cherrypy.NotFound()
        if len(suffix) == 1:
            ucid = suffix[0]
        elif len(suffix) == 2 and suffix[0] in possible_parts:
            part, ucid = suffix
        elif len(suffix) == 2 and suffix[1] in possible_parts:
            ucid, part = suffix
        else:
            # Also reached for three or more components, which previously
            # could fail while unpacking.
            return {
                "error": "Two components specified in URL, but neither component was recognised as a part keyword.",
                "identifier": "PART_KEYWORD_NOT_RECOGNISED"
            }

        possible_paths = ("channel",) if part == "latest" else ("channel", "c", "user")
        if second__path not in possible_paths:
            return {
                "error": "second__path parameter must be one of: " + str(possible_paths),
                "identifier": "PATH_PARAMETER_NOT_RECOGNISED"
            }

        if part == "playlists":
            return []
        elif part == "latest":
            return extract_channel_latest(ucid)
        elif part == "videos":
            return extract_channel_videos(ucid, second__path)
        else:  # part == "", so extract whole channel
            return extract_channel(ucid, second__path)

    @cherrypy.expose
    @cherrypy.tools.json_out()
    def search(self, *suffix, q, **kwargs):
        """Return search results for ``q``.

        When the only extra path component is ``suggestions``, the request is
        answered by ``suggestions`` instead.
        """
        if suffix == ("suggestions",):
            return self.suggestions(q=q)
        return extract_search(q)

    @cherrypy.expose
    @cherrypy.tools.json_out()
    def suggestions(self, *, q, **kwargs):
        """Return the result of ``extract_search_suggestions(q)`` as JSON."""
        return extract_search_suggestions(q)

    @cherrypy.expose
    def captions(self, id, **kwargs):
        """Return captions for ``id``; extra query parameters go to the extractor.

        A dict result is served as JSON, anything else as ``text/vtt``.
        A ``StopIteration`` from the extractor is answered with status 400
        and a ``NO_MATCHING_CAPTIONS`` JSON error body.
        """
        try:
            result = extract_captions(id, **kwargs)
        except StopIteration:
            cherrypy.response.status = "400"
            cherrypy.response.headers["content-type"] = "application/json"
            return bytes(json.dumps({
                "error": "No captions matching that language or label",
                "identifier": "NO_MATCHING_CAPTIONS"
            }), "utf8")

        if isinstance(result, dict):
            cherrypy.response.headers["content-type"] = "application/json"
            return bytes(json.dumps(result), "utf8")
        cherrypy.response.headers["content-type"] = "text/vtt; charset=UTF-8"
        return result

    @cherrypy.expose
    @cherrypy.tools.json_out()
    def comments(self, id, **kwargs):
        """Return the result of ``extract_comments(id)`` as JSON."""
        return extract_comments(id)

    def _proxy_bytes(self, url):
        """Fetch ``url`` and return its complete body, mirroring its content-type.

        Not exposed as a handler. Raises ``requests.HTTPError`` when the
        upstream response has an error status.
        """
        r = requests.get(url)
        r.raise_for_status()
        cherrypy.response.headers["content-type"] = r.headers["content-type"]
        # Return the whole body: taking only the first streamed chunk could
        # truncate the response and failed outright on an empty body.
        return r.content

    @cherrypy.expose
    def vi(self, id, file):
        """Proxy ``https://i.ytimg.com/vi/<id>/<file>``."""
        return self._proxy_bytes("https://i.ytimg.com/vi/{}/{}".format(id, file))

    @cherrypy.expose
    def ggpht(self, *path):
        """Proxy ``https://yt3.ggpht.com/<path>``."""
        return self._proxy_bytes("https://yt3.ggpht.com/{}".format("/".join(path)))
# Listening address: taken from the configuration module when it defines
# these attributes, otherwise the defaults below are used.
bind_host = getattr(configuration, "bind_host", "0.0.0.0")
bind_port = getattr(configuration, "bind_port", 3000)

# Static files are served from the "root" directory next to this file.
server_root = pathlib.Path(__file__).parent / "root"

cherrypy.config.update({
    "server.socket_port": bind_port,
    "server.socket_host": bind_host,
})

# Per-path settings for "/": enable the custom headers tool and static files.
_root_config = {
    "tools.custom_headers.on": True,
    "tools.staticdir.on": True,
    "tools.staticdir.dir": str(server_root.absolute()),
    "tools.staticdir.index": "index.html",
}

cherrypy.quickstart(NewLeaf(), "/", {"/": _root_config})