Browse Source

Set host header for link validator (#2409)

pull/2653/head
Dmytro Khmelenko 3 years ago
committed by GitHub
parent
commit
3979c871cd
No known key found for this signature in database. GPG Key ID: 4AEE18F83AFDEB23
1 changed file with 8 additions and 1 deletion
  1. +8
    -1
      build/validate_links.py

+ 8
- 1
build/validate_links.py View File

@@ -51,9 +51,16 @@ def validate_links(links):
  for link in links:
  h = httplib2.Http(disable_ssl_certificate_validation=True, timeout=25)
  try:
+ # fetching host name, removing leading www
+ host = link.split('//', 1)[1].split('/', 1)[0]
+ if host[:3] == 'www':
+ host = host[4:]
  resp = h.request(link, headers={
  # Faking user agent as some hosting services block not-whitelisted UA
- 'user-agent': 'Mozilla/5.0'
+ 'user-agent': 'Mozilla/5.0',
+ # setting host because Cloudflare returns 403 asking for captcha if host is missing
+ 'host': host
  })
  code = int(resp[0]['status'])
  # Checking status code errors


Loading…
Cancel
Save