move bypass captcha into job class

2025-08-06 12:48:29 +00:00 · 2020-10-16 21:00:04 -05:00 · 2020-10-16 21:00:04 -05:00 · 496a78bafe
commit 496a78bafe
parent ddc8892624
3 changed files with 137 additions and 130 deletions
--- a/src/invidious.cr
+++ b/src/invidious.cr
@ -167,6 +167,10 @@ if config.statistics_enabled
  Invidious::Jobs.register Invidious::Jobs::StatisticsRefreshJob.new(PG_DB, config, SOFTWARE)
 end

+# Register the captcha-bypass job only when a captcha solver key is configured.
+if CONFIG.captcha_key
+  Invidious::Jobs.register Invidious::Jobs::BypassCaptchaJob.new(logger, config)
+end
+
 Invidious::Jobs.register Invidious::Jobs::PullPopularVideosJob.new(PG_DB)
 Invidious::Jobs.register Invidious::Jobs::UpdateDecryptFunctionJob.new
 Invidious::Jobs.start_all
@ -177,20 +181,6 @@ end

 DECRYPT_FUNCTION = Invidious::Jobs::UpdateDecryptFunctionJob::DECRYPT_FUNCTION

-if CONFIG.captcha_key
-  spawn do
-    bypass_captcha(CONFIG.captcha_key, logger) do |cookies|
-      cookies.each do |cookie|
-        config.cookies << cookie
-      end
-
-      # Persist cookies between runs
-      CONFIG.cookies = config.cookies
-      File.write("config/config.yml", config.to_yaml)
-    end
-  end
-end
-
 connection_channel = Channel({Bool, Channel(PQ::Notification)}).new(32)
 spawn do
  connections = [] of Channel(PQ::Notification)
--- a/src/invidious/helpers/jobs.cr
+++ b/src/invidious/helpers/jobs.cr
@ -65,122 +65,6 @@ def pull_popular_videos(db)
  end
 end

-def bypass_captcha(captcha_key, logger)
-  loop do
-    begin
-      {"/watch?v=CvFH_6DNRCY&gl=US&hl=en&has_verified=1&bpctr=9999999999", produce_channel_videos_url(ucid: "UCXuqSBlHAE6Xw-yeJA0Tunw")}.each do |path|
-        response = YT_POOL.client &.get(path)
-        if response.body.includes?("To continue with your YouTube experience, please fill out the form below.")
-          html = XML.parse_html(response.body)
-          form = html.xpath_node(%(//form[@action="/das_captcha"])).not_nil!
-          site_key = form.xpath_node(%(.//div[@id="recaptcha"])).try &.["data-sitekey"]
-          s_value = form.xpath_node(%(.//div[@id="recaptcha"])).try &.["data-s"]
-
-          inputs = {} of String => String
-          form.xpath_nodes(%(.//input[@name])).map do |node|
-            inputs[node["name"]] = node["value"]
-          end
-
-          headers = response.cookies.add_request_headers(HTTP::Headers.new)
-
-          response = JSON.parse(HTTP::Client.post("https://api.anti-captcha.com/createTask", body: {
-            "clientKey" => CONFIG.captcha_key,
-            "task"      => {
-              "type"                => "NoCaptchaTaskProxyless",
-              "websiteURL"          => "https://www.youtube.com#{path}",
-              "websiteKey"          => site_key,
-              "recaptchaDataSValue" => s_value,
-            },
-          }.to_json).body)
-
-          raise response["error"].as_s if response["error"]?
-          task_id = response["taskId"].as_i
-
-          loop do
-            sleep 10.seconds
-
-            response = JSON.parse(HTTP::Client.post("https://api.anti-captcha.com/getTaskResult", body: {
-              "clientKey" => CONFIG.captcha_key,
-              "taskId"    => task_id,
-            }.to_json).body)
-
-            if response["status"]?.try &.== "ready"
-              break
-            elsif response["errorId"]?.try &.as_i != 0
-              raise response["errorDescription"].as_s
-            end
-          end
-
-          inputs["g-recaptcha-response"] = response["solution"]["gRecaptchaResponse"].as_s
-          headers["Cookies"] = response["solution"]["cookies"].as_h?.try &.map { |k, v| "#{k}=#{v}" }.join("; ") || ""
-          response = YT_POOL.client &.post("/das_captcha", headers, form: inputs)
-
-          yield response.cookies.select { |cookie| cookie.name != "PREF" }
-        elsif response.headers["Location"]?.try &.includes?("/sorry/index")
-          location = response.headers["Location"].try { |u| URI.parse(u) }
-          headers = HTTP::Headers{":authority" => location.host.not_nil!}
-          response = YT_POOL.client &.get(location.full_path, headers)
-
-          html = XML.parse_html(response.body)
-          form = html.xpath_node(%(//form[@action="index"])).not_nil!
-          site_key = form.xpath_node(%(.//div[@id="recaptcha"])).try &.["data-sitekey"]
-          s_value = form.xpath_node(%(.//div[@id="recaptcha"])).try &.["data-s"]
-
-          inputs = {} of String => String
-          form.xpath_nodes(%(.//input[@name])).map do |node|
-            inputs[node["name"]] = node["value"]
-          end
-
-          captcha_client = HTTPClient.new(URI.parse("https://api.anti-captcha.com"))
-          captcha_client.family = CONFIG.force_resolve || Socket::Family::INET
-          response = JSON.parse(captcha_client.post("/createTask", body: {
-            "clientKey" => CONFIG.captcha_key,
-            "task"      => {
-              "type"                => "NoCaptchaTaskProxyless",
-              "websiteURL"          => location.to_s,
-              "websiteKey"          => site_key,
-              "recaptchaDataSValue" => s_value,
-            },
-          }.to_json).body)
-
-          raise response["error"].as_s if response["error"]?
-          task_id = response["taskId"].as_i
-
-          loop do
-            sleep 10.seconds
-
-            response = JSON.parse(captcha_client.post("/getTaskResult", body: {
-              "clientKey" => CONFIG.captcha_key,
-              "taskId"    => task_id,
-            }.to_json).body)
-
-            if response["status"]?.try &.== "ready"
-              break
-            elsif response["errorId"]?.try &.as_i != 0
-              raise response["errorDescription"].as_s
-            end
-          end
-
-          inputs["g-recaptcha-response"] = response["solution"]["gRecaptchaResponse"].as_s
-          headers["Cookies"] = response["solution"]["cookies"].as_h?.try &.map { |k, v| "#{k}=#{v}" }.join("; ") || ""
-          response = YT_POOL.client &.post("/sorry/index", headers: headers, form: inputs)
-          headers = HTTP::Headers{
-            "Cookie" => URI.parse(response.headers["location"]).query_params["google_abuse"].split(";")[0],
-          }
-          cookies = HTTP::Cookies.from_headers(headers)
-
-          yield cookies
-        end
-      end
-    rescue ex
-      logger.puts("Exception: #{ex.message}")
-    ensure
-      sleep 1.minute
-      Fiber.yield
-    end
-  end
-end
-
 def find_working_proxies(regions)
  loop do
    regions.each do |region|
--- a/src/invidious/jobs/bypass_captcha_job.cr
+++ b/src/invidious/jobs/bypass_captcha_job.cr
@ -0,0 +1,133 @@
+# Background job that probes YouTube for captcha walls, has them solved through
+# the anti-captcha.com API (authenticated with `config.captcha_key`), and stores
+# the resulting cookies in `config.cookies` and in `config/config.yml`.
+class Invidious::Jobs::BypassCaptchaJob < Invidious::Jobs::BaseJob
+  private getter logger : Invidious::LogHandler
+  private getter config : Config
+
+  def initialize(@logger, @config)
+  end
+
+  # Runs forever. Each round requests one watch page and one channel page and
+  # handles whichever captcha flow (if any) the response shows. Any exception
+  # aborts the current round and is logged; the job then sleeps one minute
+  # before the next round.
+  def begin
+    loop do
+      begin
+        {"/watch?v=CvFH_6DNRCY&gl=US&hl=en&has_verified=1&bpctr=9999999999", produce_channel_videos_url(ucid: "UCXuqSBlHAE6Xw-yeJA0Tunw")}.each do |path|
+          response = YT_POOL.client &.get(path)
+          if response.body.includes?("To continue with your YouTube experience, please fill out the form below.")
+            bypass_das_captcha(path, response)
+          elsif response.headers["Location"]?.try &.includes?("/sorry/index")
+            bypass_sorry_page(response)
+          end
+        end
+      rescue ex
+        logger.puts("Exception: #{ex.message}")
+      ensure
+        sleep 1.minute
+        Fiber.yield
+      end
+    end
+  end
+
+  # Handles the in-page "/das_captcha" form found in the body of *page*, the
+  # response received for *path*. Stores every cookie returned by the form
+  # submission except the one named "PREF".
+  private def bypass_das_captcha(path, page)
+    html = XML.parse_html(page.body)
+    form = html.xpath_node(%(//form[@action="/das_captcha"])).not_nil!
+    inputs = form_inputs(form)
+
+    # Send the cookies YouTube set on the captcha page back with the answer.
+    headers = page.cookies.add_request_headers(HTTP::Headers.new)
+
+    solution = solve_captcha("https://www.youtube.com#{path}", form) do |endpoint, payload|
+      HTTP::Client.post("https://api.anti-captcha.com#{endpoint}", body: payload)
+    end
+
+    inputs["g-recaptcha-response"] = solution["gRecaptchaResponse"].as_s
+    # NOTE(review): "Cookies" is not the standard request header name ("Cookie").
+    # Kept unchanged to preserve what is sent today - confirm the intent.
+    headers["Cookies"] = solution["cookies"].as_h?.try &.map { |k, v| "#{k}=#{v}" }.join("; ") || ""
+    response = YT_POOL.client &.post("/das_captcha", headers, form: inputs)
+
+    persist_cookies(response.cookies.select { |cookie| cookie.name != "PREF" })
+  end
+
+  # Handles a redirect to a "/sorry/index" page. Follows the Location header of
+  # *redirect*, solves the captcha form found there, and stores the cookie
+  # taken from the `google_abuse` query parameter of the final redirect.
+  private def bypass_sorry_page(redirect)
+    location = redirect.headers["Location"].try { |u| URI.parse(u) }
+    headers = HTTP::Headers{":authority" => location.host.not_nil!}
+    response = YT_POOL.client &.get(location.full_path, headers)
+
+    html = XML.parse_html(response.body)
+    form = html.xpath_node(%(//form[@action="index"])).not_nil!
+    inputs = form_inputs(form)
+
+    # This flow talks to the solver through the project's HTTPClient so the
+    # address family can follow `config.force_resolve` (IPv4 when unset).
+    captcha_client = HTTPClient.new(URI.parse("https://api.anti-captcha.com"))
+    captcha_client.family = config.force_resolve || Socket::Family::INET
+    solution = solve_captcha(location.to_s, form) do |endpoint, payload|
+      captcha_client.post(endpoint, body: payload)
+    end
+
+    inputs["g-recaptcha-response"] = solution["gRecaptchaResponse"].as_s
+    # NOTE(review): "Cookies" is not the standard request header name ("Cookie").
+    # Kept unchanged to preserve what is sent today - confirm the intent.
+    headers["Cookies"] = solution["cookies"].as_h?.try &.map { |k, v| "#{k}=#{v}" }.join("; ") || ""
+    response = YT_POOL.client &.post("/sorry/index", headers: headers, form: inputs)
+
+    # Only the first ";"-separated segment of `google_abuse` is kept as the cookie.
+    headers = HTTP::Headers{
+      "Cookie" => URI.parse(response.headers["location"]).query_params["google_abuse"].split(";")[0],
+    }
+    persist_cookies(HTTP::Cookies.from_headers(headers))
+  end
+
+  # Returns a name => value hash of every `<input>` under *form* that has a
+  # `name` attribute.
+  private def form_inputs(form)
+    inputs = {} of String => String
+    form.xpath_nodes(%(.//input[@name])).each do |node|
+      inputs[node["name"]] = node["value"]
+    end
+    inputs
+  end
+
+  # Creates a "NoCaptchaTaskProxyless" task for the recaptcha widget inside
+  # *form*, then polls every 10 seconds until the task is ready and returns the
+  # "solution" object of the reply.
+  #
+  # The block receives an API path ("/createTask" or "/getTaskResult") and a
+  # JSON request body, and must perform the POST and return the HTTP response.
+  #
+  # Raises with the API's error text when task creation reports an error, or
+  # when a poll reply is not ready and its "errorId" is not 0.
+  private def solve_captcha(website_url, form)
+    recaptcha = form.xpath_node(%(.//div[@id="recaptcha"]))
+    site_key = recaptcha.try &.["data-sitekey"]
+    s_value = recaptcha.try &.["data-s"]
+
+    create_payload = {
+      "clientKey" => config.captcha_key,
+      "task"      => {
+        "type"                => "NoCaptchaTaskProxyless",
+        "websiteURL"          => website_url,
+        "websiteKey"          => site_key,
+        "recaptchaDataSValue" => s_value,
+      },
+    }.to_json
+    created = yield("/createTask", create_payload)
+    task = JSON.parse(created.body)
+
+    raise task["error"].as_s if task["error"]?
+    task_id = task["taskId"].as_i
+
+    poll_payload = {
+      "clientKey" => config.captcha_key,
+      "taskId"    => task_id,
+    }.to_json
+
+    loop do
+      sleep 10.seconds
+
+      polled = yield("/getTaskResult", poll_payload)
+      result = JSON.parse(polled.body)
+
+      if result["status"]?.try &.== "ready"
+        return result["solution"]
+      elsif result["errorId"]?.try &.as_i != 0
+        raise result["errorDescription"].as_s
+      end
+    end
+  end
+
+  # Appends *cookies* to `config.cookies` and rewrites `config/config.yml` so
+  # the cookies persist between runs.
+  private def persist_cookies(cookies)
+    cookies.each { |cookie| config.cookies << cookie }
+    File.write("config/config.yml", config.to_yaml)
+  end
+end