[virtualbox] Add automation (#438)

Using https://www.virtualbox.org/wiki/Download_Old_Builds.
This commit is contained in:
Marc Wrobel
2025-05-17 11:25:54 +02:00
parent dacf569bfc
commit aa43bf6602
2 changed files with 36 additions and 0 deletions

View File

@@ -25,6 +25,7 @@ def parse_month_year_date(text: str, formats: list[str] = frozenset([
"%B %Y", # January 2020
"%b %Y", # Jan 2020
"%Y-%m", # 2020-01
"%Y/%m", # 2020/01
"%m-%Y", # 01-2020
"%m/%Y", # 01/2020
])) -> datetime:

35
src/virtualbox.py Normal file
View File

@@ -0,0 +1,35 @@
"""Fetches releases from VirtualBox download page."""

import logging
import re

from bs4 import BeautifulSoup
from common import dates, http, releasedata

# Matches the link text of a release entry (e.g. "VirtualBox 6.1") and
# captures the "major.minor" release name.
RELEASE_REGEX = re.compile(r"^VirtualBox (?P<value>\d+\.\d+)$")
# Matches the lower-cased end-of-support note and captures its "YYYY/MM" date.
EOL_REGEX = re.compile(r"^\(no longer supported, support ended (?P<value>\d{4}/\d{2})\)$")

with releasedata.ProductData("virtualbox") as product_data:
    response = http.fetch_url("https://www.virtualbox.org/wiki/Download_Old_Builds")
    soup = BeautifulSoup(response.text, features="html5lib")

    # The releases are listed in the <ul> immediately following the page heading.
    builds_list = soup.select_one("#DownloadVirtualBoxOldBuilds + ul")
    if builds_list is None:
        # Fail loudly with an explicit message rather than an opaque
        # AttributeError: the page layout has most likely changed.
        raise ValueError("Could not find the list of old builds on the VirtualBox download page")

    for li in builds_list.find_all("li"):
        link = li.find("a")
        if link is None:
            # An entry without a link carries no release name to parse.
            logging.info(f"Skipping '{li.text.strip()}': no link found")
            continue

        li_text = link.text.strip()
        release_match = RELEASE_REGEX.match(li_text)
        if not release_match:
            logging.info(f"Skipping '{li_text}': does not match {RELEASE_REGEX}")
            continue

        release_name = release_match.group("value")
        # Declare the release even when no end-of-support date can be extracted below.
        release = product_data.get_release(release_name)

        eol_note = li.find("em")
        if eol_note is None:
            # No end-of-support note on this entry: nothing more to record.
            logging.info(f"Ignoring EOL for '{li_text}': no end-of-support note found")
            continue

        # Lower-cased so the match does not depend on the note's capitalization.
        eol_text = eol_note.text.lower().strip()
        eol_match = EOL_REGEX.match(eol_text)
        if not eol_match:
            logging.info(f"Ignoring '{eol_text}': does not match {EOL_REGEX}")
            continue

        eol_date_str = eol_match.group("value")
        eol_date = dates.parse_month_year_date(eol_date_str)
        release.set_eol(eol_date)