diff options
| author | diogo464 <[email protected]> | 2025-07-24 12:36:27 +0100 |
|---|---|---|
| committer | diogo464 <[email protected]> | 2025-07-24 12:36:27 +0100 |
| commit | 6138d43d3ff8736bbcb95e4e34cdbb3f79f4d7cc (patch) | |
| tree | dab2a28fa339cfd2f8f64d0887d700acb1328921 /setup-directories | |
| parent | 9111cb454a6ea62dacbafad49a0aabafc7066bf8 (diff) | |
fix: urldecode the slug field
Diffstat (limited to 'setup-directories')
| -rwxr-xr-x | setup-directories | 4 |
1 file changed, 3 insertions, 1 deletion
diff --git a/setup-directories b/setup-directories index d3548b14f..ab94676b1 100755 --- a/setup-directories +++ b/setup-directories | |||
| @@ -4,6 +4,8 @@ import os | |||
| 4 | import shutil | 4 | import shutil |
| 5 | import xml.etree.ElementTree as ET | 5 | import xml.etree.ElementTree as ET |
| 6 | 6 | ||
| 7 | from urllib.parse import unquote | ||
| 8 | |||
| 7 | ignored_urls = ["https://www.portugalrunning.com/eventos/"] | 9 | ignored_urls = ["https://www.portugalrunning.com/eventos/"] |
| 8 | tree = ET.parse("sitemap.xml") | 10 | tree = ET.parse("sitemap.xml") |
| 9 | root = tree.getroot() | 11 | root = tree.getroot() |
| @@ -28,7 +30,7 @@ for url_element in root.findall(".//{*}url"): | |||
| 28 | 30 | ||
| 29 | slug = re.match("https://www.portugalrunning.com/eventos/([^/]*)/", url) | 31 | slug = re.match("https://www.portugalrunning.com/eventos/([^/]*)/", url) |
| 30 | assert slug is not None, f"failed to extract slug from '{url}'" | 32 | assert slug is not None, f"failed to extract slug from '{url}'" |
| 31 | slug = slug[1] | 33 | slug = unquote(slug[1]) |
| 32 | 34 | ||
| 33 | event_dir = os.path.join("events", slug) | 35 | event_dir = os.path.join("events", slug) |
| 34 | page_path = os.path.join(event_dir, "page.html") | 36 | page_path = os.path.join(event_dir, "page.html") |
