2022-03-10 14:26:22 +00:00
|
|
|
from bs4 import BeautifulSoup
|
|
|
|
import requests
|
|
|
|
|
|
|
|
from app import app
|
2022-05-01 16:23:45 +01:00
|
|
|
from app.extensions import db
|
2022-04-22 14:01:16 +01:00
|
|
|
from app.models.mirrors import Proxy
|
2022-03-10 14:26:22 +00:00
|
|
|
|
|
|
|
|
|
|
|
def check_blocks():
|
2022-05-01 16:38:41 +01:00
|
|
|
user_agent = {'User-agent': 'BypassCensorship/1.0'}
|
2022-03-10 14:26:22 +00:00
|
|
|
page = requests.get(app.config['EXTERNAL_CHECK_URL'], headers=user_agent)
|
|
|
|
soup = BeautifulSoup(page.content, 'html.parser')
|
|
|
|
h2 = soup.find_all('h2')
|
|
|
|
div = soup.find_all('div', class_="overflow-auto mb-5")
|
|
|
|
|
|
|
|
results = {}
|
|
|
|
|
|
|
|
i = 0
|
|
|
|
while i < len(h2):
|
|
|
|
if not div[i].div:
|
|
|
|
urls = []
|
|
|
|
a = div[i].find_all('a')
|
|
|
|
j = 0
|
|
|
|
while j < len(a):
|
|
|
|
urls.append(a[j].text)
|
|
|
|
j += 1
|
|
|
|
results[h2[i].text] = urls
|
|
|
|
else:
|
|
|
|
results[h2[i].text] = []
|
|
|
|
i += 1
|
|
|
|
|
|
|
|
for vp in results:
|
|
|
|
if vp not in app.config['EXTERNAL_VANTAGE_POINTS']:
|
|
|
|
continue
|
|
|
|
for url in results[vp]:
|
2022-05-01 16:38:41 +01:00
|
|
|
print(f"Found {url} blocked")
|
|
|
|
proxy = Proxy.query.filter(
|
|
|
|
Proxy.provider == "cloudfront",
|
|
|
|
Proxy.url == f"https://{url}"
|
|
|
|
).first()
|
|
|
|
if not proxy:
|
|
|
|
print("Proxy not found")
|
|
|
|
continue
|
|
|
|
if not proxy.origin.auto_rotation:
|
|
|
|
print("Proxy auto-rotation forbidden for origin")
|
|
|
|
if proxy.deprecated:
|
|
|
|
print("Proxy already marked blocked")
|
|
|
|
continue
|
|
|
|
proxy.deprecate(reason="external")
|
|
|
|
|
2022-05-01 16:23:45 +01:00
|
|
|
db.session.commit()
|
2022-03-10 14:26:22 +00:00
|
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
|
|
|
|
with app.app_context():
|
|
|
|
check_blocks()
|