diff options
| author | Gertjan van den Burg <gertjanvandenburg@gmail.com> | 2020-01-07 14:26:31 +0000 |
|---|---|---|
| committer | Gertjan van den Burg <gertjanvandenburg@gmail.com> | 2020-01-07 14:26:31 +0000 |
| commit | 2b4fc42e99f08052fe73f92845f4b155d05fee25 (patch) | |
| tree | 974e50993e00d046e28027efef39e3d2e303f782 | |
| parent | Update readme (diff) | |
| download | paper2remarkable-2b4fc42e99f08052fe73f92845f4b155d05fee25.tar.gz paper2remarkable-2b4fc42e99f08052fe73f92845f4b155d05fee25.zip | |
Carry cookies over when redirecting
This was needed for ACM, and is likely beneficial
for other sites as well.
| -rw-r--r-- | paper2remarkable/utils.py | 8 |
1 file changed, 5 insertions, 3 deletions
```diff
diff --git a/paper2remarkable/utils.py b/paper2remarkable/utils.py
index cc8a417..de27973 100644
--- a/paper2remarkable/utils.py
+++ b/paper2remarkable/utils.py
@@ -96,15 +96,17 @@ def get_page_with_retry(url, tries=5):
 
 
 def follow_redirects(url):
-    """Follow redirects from the URL (at most 10)"""
+    """Follow redirects from the URL (at most 100)"""
     it = 0
-    while it < 10:
-        req = requests.head(url, allow_redirects=False)
+    jar = {}
+    while it < 100:
+        req = requests.head(url, allow_redirects=False, cookies=jar)
         if req.status_code == 200:
             break
         if not "Location" in req.headers:
             break
         url = req.headers["Location"]
+        jar = req.cookies
         it += 1
     return url
 
```
