It may not be the best place for that (gha.py would have been better), but it's the shorter / faster way to do it for now. Moreover it now uses logging for writing the group. The logger format has been updated for this to work. This was done to fix issues on GitHub Action logs, where groups were declared after the logs.
30 lines
1.2 KiB
Python
30 lines
1.2 KiB
Python
import sys
|
|
|
|
from bs4 import BeautifulSoup
|
|
from common import dates, endoflife, http
|
|
|
|
METHOD = 'distrowatch'
|
|
|
|
p_filter = sys.argv[1] if len(sys.argv) > 1 else None
|
|
for product_name in endoflife.list_products(METHOD, p_filter):
|
|
product = endoflife.Product(product_name)
|
|
product_frontmatter = endoflife.ProductFrontmatter(product.name)
|
|
for config in product_frontmatter.get_auto_configs(METHOD):
|
|
response = http.fetch_url(f"https://distrowatch.com/index.php?distribution={config.url}")
|
|
soup = BeautifulSoup(response.text, features="html5lib")
|
|
|
|
for table in soup.select("td.News1>table.News"):
|
|
headline = table.select_one("td.NewsHeadline a[href]").get_text().strip()
|
|
versions_match = config.first_match(headline)
|
|
if not versions_match:
|
|
continue
|
|
|
|
# multiple versions may be released at once (e.g. Ubuntu 16.04.7 and 18.04.5)
|
|
versions = config.render(versions_match).split("\n")
|
|
date = dates.parse_date(table.select_one("td.NewsDate").get_text())
|
|
|
|
for version in versions:
|
|
product.declare_version(version, date)
|
|
|
|
product.write()
|