Files
endoflife-date-release-data/src/splunk.py
Marc Wrobel 56cc29b49d Make releasedata.Product usable in 'with' expression (#294)
This way the writing of the JSON file is handled automatically if the update does not fail.
It pave the way to further global improvements, such as a better error handling.
2024-02-04 14:48:05 +01:00

48 lines
2.2 KiB
Python

import re
from bs4 import BeautifulSoup
from common import dates, http, releasedata
VERSION_DATE_PATTERN = re.compile(r"Splunk Enterprise (?P<version>\d+\.\d+(?:\.\d+)*) was (?:first )?released on (?P<date>\w+\s\d\d?,\s\d{4})\.", re.MULTILINE)
def get_latest_minor_versions(versions: list[str]) -> list[str]:
versions_split = [v.split('.') for v in versions]
# Group versions by major and minor version
version_groups = {}
for version in versions_split:
major, minor = map(int, version[:2])
# Release notes for versions before 7.2 don't contain release information
if major < 7 or (major == 7 and minor < 2):
continue
major_minor = '.'.join(version[:2])
if major_minor not in version_groups:
version_groups[major_minor] = []
version_groups[major_minor].append(version)
# For each group, find the version with the highest patch version
latest_versions = []
for version_group in version_groups.values():
latest_patch = max(version_group, key=lambda v: int(v[2]))
latest_versions.append('.'.join(latest_patch))
return latest_versions
with releasedata.ProductData("splunk") as product_data:
main = http.fetch_url("https://docs.splunk.com/Documentation/Splunk")
soup = BeautifulSoup(main.text, features="html5lib")
all_versions = [option.attrs['value'] for option in soup.select("select#version-select > option")]
# Latest minor release notes contains release notes for all previous minor versions.
# For example, 9.0.5 release notes also contains release notes for 9.0.0 to 9.0.4.
latest_minor_versions = get_latest_minor_versions(all_versions)
latest_minor_versions_urls = [f"https://docs.splunk.com/Documentation/Splunk/{v}/ReleaseNotes/MeetSplunk" for v in latest_minor_versions]
for response in http.fetch_urls(latest_minor_versions_urls):
for (version_str, date_str) in VERSION_DATE_PATTERN.findall(response.text):
version_str = f"{version_str}.0" if len(version_str.split(".")) == 2 else version_str # convert x.y to x.y.0
date = dates.parse_date(date_str)
product_data.declare_version(version_str, date)