From 0ca092f78e297198255e1681624937060f211bf7 Mon Sep 17 00:00:00 2001
From: Charles Tapley Hoyt
Date: Thu, 15 Feb 2024 10:39:47 +0100
Subject: [PATCH] Enable timeouts when getting soup

---
 src/bioversions/utils.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/bioversions/utils.py b/src/bioversions/utils.py
index 8c0b1225..3192e929 100644
--- a/src/bioversions/utils.py
+++ b/src/bioversions/utils.py
@@ -47,9 +47,9 @@ def norm(s: str) -> str:
     return s.lower().replace(" ", "").replace("-", "").replace(".", "")
 
 
-def get_soup(url: str, verify: bool = True) -> BeautifulSoup:
+def get_soup(url: str, verify: bool = True, timeout: Optional[int] = None) -> BeautifulSoup:
     """Get a beautiful soup parsed version of the given web page."""
-    res = requests.get(url, verify=verify)
+    res = requests.get(url, verify=verify, timeout=timeout or 3)
     soup = BeautifulSoup(res.text, features="html.parser")
     return soup
 