Improve HTTP handling in scripts (#449)

Provide some helper methods to hide the complexity of parsing HTML, JSON, YAML, XML or Markdown.
2025-06-28 11:46:04 +02:00
parent fda4967c38
commit 312ce078bb
43 changed files with 103 additions and 137 deletions
--- a/src/amazon-eks.py
+++ b/src/amazon-eks.py
@@ -1,6 +1,5 @@
 import logging

-from bs4 import BeautifulSoup
 from common import dates, endoflife, http, releasedata

 """Fetches EKS versions from AWS docs.
@@ -8,8 +7,8 @@ Now that AWS no longer publishes docs on GitHub, we use the Web Archive to get t

 for config in endoflife.list_configs_from_argv():
    with releasedata.ProductData(config.product) as product_data:
-        response = http.fetch_url(config.url)
-        html = BeautifulSoup(response.text, features="html5lib")
+        html = http.fetch_html(config.url)
+
        for tr in html.select("#main-col-body")[0].findAll("tr"):
            cells = tr.findAll("td")
            if not cells: