from datetime import datetime, timezone, timedelta
import logging
import time

from bs4 import BeautifulSoup

logger = logging.getLogger(__name__)

# Dates on the news page carry no zone information; they are interpreted
# at a fixed UTC+9 offset when converted to a Unix timestamp.
_NEWS_TZ = timezone(timedelta(hours=9))

_IDENTIFIER = "MAIMAIDX_INTL_PRISM"
_BASE_URL = "https://maimai.sega.jp/"
_CONTENT_PREFIX = (
    "New maimai DX International News / maimai DX International の新しいお知らせ"
)


def parse_maimaidx_intl_prism_news_site(html: str) -> list:
    """Extract news entries from the maimai DX International news page HTML.

    Every element matching ``.dl--pop__item`` yields one entry. The date is
    read from the item's ``.dl--pop__head`` element (a trailing ``" UP"``
    marker is removed) and the image from ``a.dl--pop__thumb img``.

    Items that have no date header, or whose date does not match
    ``%Y.%m.%d``, are skipped with a logged warning so that a single
    malformed item does not discard the remaining news.

    Args:
        html: Raw HTML of the news page.

    Returns:
        A list of dicts in document order, each with the keys ``date``,
        ``identifier``, ``type``, ``timestamp``, ``headline``, ``content``,
        ``url`` and ``images``. ``timestamp`` is the Unix time of midnight
        (UTC+9) on the entry's date. ``images`` holds one
        ``{"image": <absolute url>, "link": None}`` dict, or is empty when
        the item has no usable image.
    """
    soup = BeautifulSoup(html, "html.parser")
    entries = []

    for item in soup.select(".dl--pop__item"):
        head = item.select_one(".dl--pop__head")
        if head is None:
            logger.warning("Skipping news item without a date header")
            continue

        date_text = head.text.strip().replace(" UP", "")
        try:
            dt = datetime.strptime(date_text, "%Y.%m.%d").replace(tzinfo=_NEWS_TZ)
        except ValueError:
            logger.warning(
                "Skipping news item with unparseable date %r", date_text
            )
            continue
        timestamp = int(dt.timestamp())

        img_tag = item.select_one("a.dl--pop__thumb img")
        image_url = None
        if img_tag is not None:
            # Prefer ``srcset`` (what the page is expected to provide) but
            # fall back to ``src`` rather than raising KeyError.
            # NOTE(review): a multi-candidate srcset ("a.png 1x, b.png 2x")
            # is passed through unparsed, as before — confirm the page only
            # ever emits a single URL here.
            image_url = img_tag.get("srcset") or img_tag.get("src")
        full_image_url = (
            image_url.replace("../", _BASE_URL) if image_url else None
        )

        # Only mention the image when there is one, so the literal text
        # "None" never ends up in the published content.
        if full_image_url:
            content = f"{_CONTENT_PREFIX}\n\n{full_image_url}"
            images = [{"image": full_image_url, "link": None}]
        else:
            content = _CONTENT_PREFIX
            images = []

        entries.append(
            {
                "date": date_text,
                "identifier": _IDENTIFIER,
                "type": None,
                "timestamp": timestamp,
                "headline": None,
                "content": content,
                "url": None,
                "images": images,
            }
        )

    return entries