mirror of
https://git.sr.ht/~cadence/NewLeaf
synced 2024-11-14 12:07:30 +00:00
Lomanic
7d3b79b1cd
See https://github.com/benbusby/whoogle-search/issues/311 for some
context.
We're now implementing the same logic as youtube-dl's
youtube_dl/extractor/youtube.py at commit a726009987 (L263-L264).
26 lines
1.1 KiB
Python
26 lines
1.1 KiB
Python
import re
|
|
import json
|
|
import random
|
|
|
|
# Locator patterns for the JSON object assigned to ``ytInitialData`` /
# ``ytInitialPlayerResponse`` in a page. Group 1 starts at the opening brace
# of the object. Its lazy ``.+?`` capture ends at the first ``};`` that is
# followed by a terminator, which is NOT guaranteed to be the real end of the
# object, so the extract functions below only rely on where group 1 starts.
r_yt_initial_data = re.compile(
    r"""(?:^\s*window\["ytInitialData"\]|var ytInitialData) = (\{.+?\});(?:\s*$|</script>)""",
    re.S | re.M,
)
r_yt_initial_player_response = re.compile(
    r"""(?:^\s*window\["ytInitialPlayerResponse"\]|var ytInitialPlayerResponse) = (\{.+?\});(?:\s*$|</script>|var )""",
    re.S | re.M,
)


def _decode_assigned_object(pattern, content, name):
    """Locate ``name = {...};`` in *content* with *pattern* and decode the object.

    Args:
        pattern: Compiled regex whose group 1 starts at the object's opening brace.
        content: Text to search.
        name: Variable name, used only in the error message.

    Returns:
        The decoded JSON value.

    Raises:
        Exception: If *pattern* does not match anywhere in *content*.
        json.JSONDecodeError: If the text at the opening brace is not valid JSON.
    """
    match = pattern.search(content)
    if match is None:
        raise Exception("Could not match {} in content".format(name))
    # Decode from the opening brace and let the JSON parser find the matching
    # closing brace. The regex capture may be cut short when a string value
    # contains "};" followed by a terminator (e.g. "};var "), which would make
    # json.loads fail on the truncated text.
    value, _end = json.JSONDecoder().raw_decode(content[match.start(1):])
    return value


def extract_yt_initial_data(content):
    """Return the decoded ``ytInitialData`` object found in *content*.

    Raises:
        Exception: If no ``ytInitialData`` assignment can be matched.
        json.JSONDecodeError: If the assigned object is not valid JSON.
    """
    return _decode_assigned_object(r_yt_initial_data, content, "ytInitialData")


def extract_yt_initial_player_response(content):
    """Return the decoded ``ytInitialPlayerResponse`` object found in *content*.

    Raises:
        Exception: If no ``ytInitialPlayerResponse`` assignment can be matched.
        json.JSONDecodeError: If the assigned object is not valid JSON.
    """
    return _decode_assigned_object(
        r_yt_initial_player_response, content, "ytInitialPlayerResponse"
    )
|
|
|
|
def eu_consent_cookie():
    """Build a one-entry cookie dict holding a ``CONSENT`` value.

    The value is a fixed prefix followed by a random integer between 100 and
    999 inclusive, so each call may return a different suffix.
    NOTE(review): presumably sent with requests to skip the EU consent
    page -- confirm against the callers.
    """
    suffix = random.randint(100, 999)
    consent_value = "YES+cb.20210509-17-p0.en+F+{}".format(suffix)
    return {"CONSENT": consent_value}
|