From 61ee46eb34ccdb8ec7ff4e0de17614d901080284 Mon Sep 17 00:00:00 2001 From: fmk17 <fmk17@inf.ufpr.br> Date: Thu, 17 Nov 2022 17:10:18 -0300 Subject: [PATCH] Add user-agent bypass --- crawler.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/crawler.py b/crawler.py index 9c15030..b25e209 100644 --- a/crawler.py +++ b/crawler.py @@ -34,7 +34,7 @@ def get_location_days( ): return cached_responses[location] - response = requests.get(location.url) + response = requests.get(location.url, headers={'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64; rv:107.0) Gecko/20100101 Firefox/107.0'}) soup = BeautifulSoup(response.text, "lxml") post = soup.select_one("#post div:nth-child(3)") -- GitLab