#!/usr/bin/env python3
"""Extract the event URL from saved event pages.

Usage: pass one or more event slugs as command-line arguments.  For each
slug the script reads ``events/<slug>/page.html``, searches it for the
first tag whose ``class`` attribute contains
``evcal_evdata_row evo_clik_row`` followed by an ``href`` attribute, and
writes that href value to ``events/<slug>/event-url``.  Slugs that already
have an ``event-url`` file are skipped.
"""
import os
import re
import sys

# NOTE(review): the leading ``]*`` matches zero or more literal ``]``
# characters and is effectively a no-op; it looks like the remnant of a
# stripped ``<a[^>]*`` prefix -- confirm against the original script before
# changing it.  The pattern text is intentionally left untouched.
pattern = r']*class=[\'"][^\'"]*evcal_evdata_row evo_clik_row[^\'"]*[\'"][^>]*href=[\'"]([^\'"]+)[\'"][^>]*>'

# Compiled once so the per-slug loop does not repeat the pattern lookup.
_EVENT_LINK_RE = re.compile(pattern)


def extract_event_url(page_content):
    """Return the href captured by ``pattern`` in *page_content*, or None.

    Only the first match in the text is considered.
    """
    match = _EVENT_LINK_RE.search(page_content)
    return match.group(1) if match else None


def process_event(slug, events_dir="events"):
    """Write ``<events_dir>/<slug>/event-url`` from the saved page.

    Args:
        slug: Name of the event directory inside *events_dir*.
        events_dir: Directory that holds one sub-directory per event.

    Returns:
        True if an ``event-url`` file was written; False if the slug was
        skipped (file already present, page missing, or no URL found).
    """
    page_path = os.path.join(events_dir, slug, "page.html")
    event_url_path = os.path.join(events_dir, slug, "event-url")

    # Never overwrite a URL that was extracted on an earlier run.
    if os.path.exists(event_url_path):
        return False

    try:
        # Explicit encoding keeps decoding independent of the locale;
        # errors="replace" stops one bad byte from aborting the batch.
        with open(page_path, "r", encoding="utf-8", errors="replace") as f:
            page_content = f.read()
    except FileNotFoundError:
        # Report and move on, mirroring the "no event url" case below.
        print(f"event {slug} has no page.html")
        return False

    event_page_url = extract_event_url(page_content)
    if event_page_url is None:
        print(f"event {slug} has no event url")
        return False

    with open(event_url_path, "w", encoding="utf-8") as f:
        f.write(event_page_url)
    return True


def main(slugs):
    """Process every slug in *slugs* in order."""
    for slug in slugs:
        process_event(slug)


if __name__ == "__main__":
    main(sys.argv[1:])