diff options
| author | TheFrenchGhosty <47571719+TheFrenchGhosty@users.noreply.github.com> | 2020-11-26 17:28:34 +0000 |
|---|---|---|
| committer | GitHub <noreply@github.com> | 2020-11-26 17:28:34 +0000 |
| commit | 99ba9874b11bb0a5b67854d338ce968e83c69c41 (patch) | |
| tree | 733fcd8978a2bbce3a5e1d14690bc2a184ba4896 /src | |
| parent | 1973f93d4a2b54f7284cc407ef05da232272269b (diff) | |
| parent | b41ca72d2b85c8d6ee5186873bf4be4c331e3798 (diff) | |
| download | invidious-99ba9874b11bb0a5b67854d338ce968e83c69c41.tar.gz invidious-99ba9874b11bb0a5b67854d338ce968e83c69c41.tar.bz2 invidious-99ba9874b11bb0a5b67854d338ce968e83c69c41.zip | |
Merge pull request #1490 from tirz/fix-regex_parsing
fix: ytInitialData parsing with regex
Diffstat (limited to 'src')
| -rw-r--r-- | src/invidious/channels.cr | 31 | ||||
| -rw-r--r-- | src/invidious/helpers/helpers.cr | 7 | ||||
| -rw-r--r-- | src/invidious/videos.cr | 3 |
3 files changed, 14 insertions, 27 deletions
```diff
diff --git a/src/invidious/channels.cr b/src/invidious/channels.cr
index 656b9953..392c44ee 100644
--- a/src/invidious/channels.cr
+++ b/src/invidious/channels.cr
@@ -775,38 +775,31 @@ def extract_channel_community_cursor(continuation)
   cursor
 end
 
-INITDATA_PREQUERY = "window[\"ytInitialData\"] = {"
-
 def get_about_info(ucid, locale)
-  about = YT_POOL.client &.get("/channel/#{ucid}/about?gl=US&hl=en")
-  if about.status_code != 200
-    about = YT_POOL.client &.get("/user/#{ucid}/about?gl=US&hl=en")
+  result = YT_POOL.client &.get("/channel/#{ucid}/about?gl=US&hl=en")
+  if result.status_code != 200
+    result = YT_POOL.client &.get("/user/#{ucid}/about?gl=US&hl=en")
   end
 
-  if md = about.headers["location"]?.try &.match(/\/channel\/(?<ucid>UC[a-zA-Z0-9_-]{22})/)
+  if md = result.headers["location"]?.try &.match(/\/channel\/(?<ucid>UC[a-zA-Z0-9_-]{22})/)
     raise ChannelRedirect.new(channel_id: md["ucid"])
   end
 
-  if about.status_code != 200
+  if result.status_code != 200
     error_message = translate(locale, "This channel does not exist.")
     raise error_message
   end
 
-  initdata_pre = about.body.index(INITDATA_PREQUERY)
-  initdata_post = initdata_pre.nil? ? nil : about.body.index("};", initdata_pre)
-  if initdata_post.nil?
-    about = XML.parse_html(about.body)
-    error_message = about.xpath_node(%q(//div[@class="yt-alert-content"])).try &.content.strip
-    error_message ||= translate(locale, "Could not get channel info.")
+  about = XML.parse_html(result.body)
+  if about.xpath_node(%q(//div[contains(@class, "channel-empty-message")]))
+    error_message = translate(locale, "This channel does not exist.")
     raise error_message
   end
-  initdata_pre = initdata_pre.not_nil! + INITDATA_PREQUERY.size - 1
 
-  initdata = JSON.parse(about.body[initdata_pre, initdata_post - initdata_pre + 1])
-  about = XML.parse_html(about.body)
-
-  if about.xpath_node(%q(//div[contains(@class, "channel-empty-message")]))
-    error_message = translate(locale, "This channel does not exist.")
+  initdata = extract_initial_data(result.body)
+  if initdata.empty?
+    error_message = about.xpath_node(%q(//div[@class="yt-alert-content"])).try &.content.strip
+    error_message ||= translate(locale, "Could not get channel info.")
     raise error_message
   end
 
diff --git a/src/invidious/helpers/helpers.cr b/src/invidious/helpers/helpers.cr
index 620d2ec8..7a0cb3d3 100644
--- a/src/invidious/helpers/helpers.cr
+++ b/src/invidious/helpers/helpers.cr
@@ -598,12 +598,7 @@ def create_notification_stream(env, topics, connection_channel)
 end
 
 def extract_initial_data(body) : Hash(String, JSON::Any)
-  initial_data = body.match(/(window\["ytInitialData"\]|var\s+ytInitialData)\s*=\s*(?<info>.*?);+\s*\n/).try &.["info"] || "{}"
-  if initial_data.starts_with?("JSON.parse(\"")
-    return JSON.parse(JSON.parse(%({"initial_data":"#{initial_data[12..-3]}"}))["initial_data"].as_s).as_h
-  else
-    return JSON.parse(initial_data).as_h
-  end
+  return JSON.parse(body.match(/(window\["ytInitialData"\]|var\s*ytInitialData)\s*=\s*(JSON\.parse\(")?(?<info>\{.*?\})("\))?;/m).try &.["info"] || "{}").as_h
 end
 
 def proxy_file(response, env)
diff --git a/src/invidious/videos.cr b/src/invidious/videos.cr
index 8e314fe0..20048460 100644
--- a/src/invidious/videos.cr
+++ b/src/invidious/videos.cr
@@ -839,8 +839,7 @@ def extract_polymer_config(body)
     params[f] = player_response[f] if player_response[f]?
   end
 
-  yt_initial_data = body.match(/(window\["ytInitialData"\]|var\s+ytInitialData)\s*=\s*(?<info>.*?);\s*\n/)
-    .try { |r| JSON.parse(r["info"]).as_h }
+  yt_initial_data = extract_initial_data(body)
 
   params["relatedVideos"] = yt_initial_data.try &.["playerOverlays"]?.try &.["playerOverlayRenderer"]?
     .try &.["endScreen"]?.try &.["watchNextEndScreenRenderer"]?.try &.["results"]?.try &.as_a.compact_map { |r|
```
