[discourse] Add auto method (#515)

Closes #505.
This commit is contained in:
Marc Wrobel
2025-09-11 12:21:20 +02:00
committed by GitHub
parent add9ee5bed
commit d190da8073
2 changed files with 31 additions and 0 deletions

View File

@@ -58,6 +58,7 @@ def parse_datetime(text: str, formats: list[str] = frozenset([
"%a %d %b %Y %H:%M:%S %z", # Wed 01 Jan 2020 00:00:00 -0400
"%a %b %d %H:%M:%S %Z %Y", # Wed Jan 01 00:00:00 UTC 2020
"%a %b %d %H:%M:%S %z %Y", # Wed Jan 01 00:00:00 -0400 2020
"%b %d %Y %I:%M %p", # Jan 1 2020 0:00 pm
"%Y%m%d%H%M%S", # 20230501083234
]), to_utc: bool = True) -> datetime:
"""Parse a given text representing a datetime using a list of formats,

30
src/discourse.py Normal file
View File

@@ -0,0 +1,30 @@
import logging
import re
from bs4 import BeautifulSoup
from common import dates, http
from common.releasedata import ProductData, config_from_argv
"""Fetch versions from a discourse server."""
config = config_from_argv()
with ProductData(config.product) as product_data:
html = BeautifulSoup(http.fetch_javascript_url(config.url))
for topic in html.select("tr.topic-list-item"):
title = topic.select_one("span.link-top-line").get_text(strip=True)
versions = config.first_match(title)
if not versions:
logging.debug("Skipping %s: does not match regex", title)
continue
name = config.render(versions)
print(topic)
date_str = topic.select_one("td.activity").get("title").strip()
date_match = re.search(r"Created:\s*([A-Za-z]+\s+\d{1,2},\s+\d{4}\s+\d{1,2}:\d{2}\s+[ap]m)", date_str)
if not date_match:
logging.debug("Skipping %s: no created date found", title)
continue
date = dates.parse_datetime(date_match.group(1))
product_data.declare_version(name, date)