"""Collect HTTP/HTTPS proxy addresses from public GitHub proxy lists.

Run as a script, this downloads the fate0 JSON-lines feed and every plain
``host:port`` list in ``PLAIN_SOURCES``, formats each entry as
``scheme://host:port`` and prints the de-duplicated result to stdout, one
proxy per line.

Based on scrape_proxies.py as of commit 5fc96e5 ("[add] More proxy sources",
Pablo Aramburo, 2022-09-16).
"""
import json
import sys
from typing import Callable, Iterable, List, Optional

# Seconds to wait on any single download before giving up on that source.
REQUEST_TIMEOUT = 15

# fate0/proxylist: one JSON object per line with "type", "host" and "port".
FATE0_URL = 'https://raw.githubusercontent.com/fate0/proxylist/master/proxy.list'

# Plain-text sources: (scheme to prepend, URL of a newline-separated
# ``host:port`` listing). Order is the order results are accumulated in.
PLAIN_SOURCES = (
    # ShiftyTR/Proxy-List
    ('https', 'https://raw.githubusercontent.com/ShiftyTR/Proxy-List/master/https.txt'),
    ('http', 'https://raw.githubusercontent.com/ShiftyTR/Proxy-List/master/http.txt'),
    # rdavydov/proxy-list
    ('http', 'https://raw.githubusercontent.com/rdavydov/proxy-list/main/proxies_anonymous/http.txt'),
    # mmpx12/proxy-list
    ('https', 'https://raw.githubusercontent.com/mmpx12/proxy-list/master/https.txt'),
    ('http', 'https://raw.githubusercontent.com/mmpx12/proxy-list/master/http.txt'),
    # IshanSingla/proxy-list -- disabled: these lists are updated infrequently.
    # ('https', 'https://raw.githubusercontent.com/IshanSingla/proxy-list/main/proxys/https.txt'),
    # ('http', 'https://raw.githubusercontent.com/IshanSingla/proxy-list/main/proxys/http.txt'),
    # monosans/proxy-list
    ('http', 'https://raw.githubusercontent.com/monosans/proxy-list/main/proxies_anonymous/http.txt'),
    # TheSpeedX/PROXY-List
    ('http', 'https://raw.githubusercontent.com/TheSpeedX/PROXY-List/master/http.txt'),
)


def parse_plain_list(text: str, scheme: str) -> List[str]:
    """Return ``scheme://entry`` for every non-blank line of *text*.

    Lines are stripped first, so blank lines and stray whitespace in a
    downloaded list never turn into bogus entries such as ``http://``.
    """
    entries = (raw.strip() for raw in text.splitlines())
    return [f'{scheme}://{entry}' for entry in entries if entry]


def parse_json_lines(text: str, anonymity: Optional[str] = None) -> List[str]:
    """Return ``type://host:port`` for every usable JSON line of *text*.

    Lines that are blank, are not valid JSON, are not JSON objects, or lack
    one of the ``type``/``host``/``port`` keys are skipped instead of
    aborting the whole run.

    The original script's filter on ``anonymity == 'high_anonymous'`` was
    commented out; it stays off by default. Pass ``anonymity`` to keep only
    records whose ``"anonymity"`` field equals that value.
    """
    proxies = []
    for raw in text.splitlines():
        raw = raw.strip()
        if not raw:
            continue
        try:
            record = json.loads(raw)
        except ValueError:  # json.JSONDecodeError is a ValueError subclass
            continue
        if not isinstance(record, dict):
            continue
        if anonymity is not None and record.get('anonymity') != anonymity:
            continue
        try:
            proxies.append(f'{record["type"]}://{record["host"]}:{record["port"]}')
        except KeyError:
            continue
    return proxies


def unique_in_order(items: Iterable[str]) -> List[str]:
    """Drop duplicates from *items*, keeping the first occurrence of each.

    Unlike ``list(set(items))`` the result order is the same on every run.
    """
    return list(dict.fromkeys(items))


def fetch_text(url: str, timeout: float = REQUEST_TIMEOUT) -> str:
    """Download *url* and return its body, or ``''`` if the download fails.

    A failure (connection error, timeout, non-2xx status) is reported on
    stderr and yields an empty body, so one dead source does not stop the
    remaining sources from being scraped and does not pollute stdout.
    """
    # Imported here so the pure parsing helpers above stay importable
    # without the third-party HTTP dependency installed.
    import requests

    try:
        response = requests.get(url, timeout=timeout)
        response.raise_for_status()
    except requests.RequestException as exc:
        print(f'warning: skipping {url}: {exc}', file=sys.stderr)
        return ''
    return response.text


def collect_proxies(fetch: Callable[[str], str] = fetch_text) -> List[str]:
    """Gather proxies from every configured source, de-duplicated.

    *fetch* maps a URL to the text found there; it defaults to a real HTTP
    download and exists so callers can supply already-downloaded text.
    """
    proxies = parse_json_lines(fetch(FATE0_URL))
    for scheme, url in PLAIN_SOURCES:
        proxies.extend(parse_plain_list(fetch(url), scheme))
    return unique_in_order(proxies)


def main() -> None:
    """Print every collected proxy on its own line."""
    for proxy in collect_proxies():
        print(proxy)


if __name__ == '__main__':
    main()