[cgit] Refactor script (#216)

Make the script more readable, mostly by:

- using the endoflife.Product class,
- introducing the endoflife.AutoConfig class to make it easier to manage such configuration,
- removing the unnecessary use of functions,
- a little bit of renaming.
This commit is contained in:
Marc Wrobel
2023-12-10 16:26:47 +01:00
committed by GitHub
parent aa7975d7f1
commit 0836c270ea
2 changed files with 83 additions and 55 deletions

View File

@@ -1,60 +1,42 @@
import re
import sys
from bs4 import BeautifulSoup
from common import http
from common import dates
from common import endoflife
from liquid import Template
"""Fetch versions with their dates from a cgit repository, such as
https://git.kernel.org/pub/scm/linux/kernel/git/stable/linux.git.
Ideally we would want to use the git repository directly, but cgit repositories
do not support partial clone so we cannot.
"""
METHOD = 'cgit'
def fetch_releases(url, regex, template):
releases = {}
response = http.fetch_url(url + '/refs/tags')
soup = BeautifulSoup(response.text, features="html5lib")
l_template = Template(template)
for table in soup.find_all("table", class_="list"):
for row in table.find_all("tr"):
columns = row.find_all("td")
if len(columns) == 4:
version_text = columns[0].text.strip()
datetime_td = columns[3].find_next("span")
datetime_text = datetime_td.attrs["title"] if datetime_td else None
if datetime_text:
matches = re.match(regex.strip(), version_text)
if matches:
match_data = matches.groupdict()
version_string = l_template.render(**match_data)
date = dates.parse_datetime(datetime_text).strftime("%Y-%m-%d")
print(f"{version_string} : {date}")
releases[version_string] = date
return releases
def update_product(product_name, configs):
versions = {}
for config in configs:
t = config.get("template", endoflife.DEFAULT_TAG_TEMPLATE)
regex = config.get("regex", endoflife.DEFAULT_VERSION_REGEX)
versions = versions | fetch_releases(config[METHOD], regex, t)
endoflife.write_releases(product_name, versions)
"""Fetches versions from repositories managed with cgit, such as the Linux kernel repository.
Ideally we would want to use the git repository directly, but cgit-managed repositories don't support partial clone."""
METHOD = "cgit"
p_filter = sys.argv[1] if len(sys.argv) > 1 else None
for product, configs in endoflife.list_products(METHOD, p_filter).items():
print(f"::group::{product}")
update_product(product, configs)
for product_name, configs in endoflife.list_products(METHOD, p_filter).items():
print(f"::group::{product_name}")
product = endoflife.Product(product_name, load_product_data=True)
for auto_config in product.get_auto_configs(METHOD):
response = http.fetch_url(auto_config.url + '/refs/tags')
soup = BeautifulSoup(response.text, features="html5lib")
for table in soup.find_all("table", class_="list"):
for row in table.find_all("tr"):
columns = row.find_all("td")
if len(columns) != 4:
continue
version_str = columns[0].text.strip()
version_match = auto_config.first_match(version_str)
if not version_match:
continue
datetime_td = columns[3].find_next("span")
datetime_str = datetime_td.attrs["title"] if datetime_td else None
if not datetime_str:
continue
version = auto_config.render(version_match)
date = dates.parse_datetime(datetime_str)
product.declare_version(version, date)
product.write()
print("::endgroup::")