Compare commits

...

4 commits

Author SHA1 Message Date
Kévin Commaille a23985296e
Simplify code to replace shortcodes
Signed-off-by: Kévin Commaille <zecakeh@tedomum.fr>
2025-05-06 12:09:28 +02:00
Kévin Commaille c1c90a6b3b
Fix and split regex
Signed-off-by: Kévin Commaille <zecakeh@tedomum.fr>
2025-05-06 11:20:56 +02:00
Kévin Commaille 163bfe7c2c
Improve doc
Signed-off-by: Kévin Commaille <zecakeh@tedomum.fr>
2025-05-06 10:53:49 +02:00
Kévin Commaille 69adb6b270
Remove trailing whitespaces
Signed-off-by: Kévin Commaille <zecakeh@tedomum.fr>
2025-05-06 10:52:47 +02:00

View file

@ -37,10 +37,10 @@ api_dir = os.path.join(os.path.dirname(scripts_dir), "data", "api")
# A shortcode is defined as (newlines and whitespaces for presentation purpose): # A shortcode is defined as (newlines and whitespaces for presentation purpose):
# #
# {{% # {{%
# <one or more whitespaces> # <zero or more whitespaces>
# <name of shortcode> # <name of shortcode>
# <one or more whitespaces> # (optional <one or more whitespaces><list of parameters>)
# (optional <list of parameters><one or more whitespaces>) # <zero or more whitespaces>
# %}} # %}}
# #
# With: # With:
@ -48,7 +48,12 @@ api_dir = os.path.join(os.path.dirname(scripts_dir), "data", "api")
# * <name of shortcode>: any word character and `-` and `/`. # * <name of shortcode>: any word character and `-` and `/`.
# * <list of parameters>: any character except `}`, must not start or end with a # * <list of parameters>: any character except `}`, must not start or end with a
# whitespace. # whitespace.
shortcode_regex = re.compile(r"\{\{\%\s+(?P<name>[\w\/-]+)\s+(?:(?P<params>[^\s\}][^\}]+[^\s\}])\s+)?\%\}\}", re.ASCII) shortcode_regex = re.compile(r"""\{\{\% # {{%
\s* # zero or more whitespaces
(?P<name>[\w/-]+) # name of shortcode
(?:\s+(?P<params>[^\s\}][^\}]+[^\s\}]))? # optional list of parameters
\s* # zero or more whitespaces
\%\}\} # %}}""", re.ASCII | re.VERBOSE)
# Parses the parameters of a Hugo shortcode. # Parses the parameters of a Hugo shortcode.
# #
@ -67,11 +72,11 @@ def prefix_absolute_path_references(text, base_url):
""" """
return text.replace("](/", "]({}/".format(base_url)) return text.replace("](/", "]({}/".format(base_url))
def replace_match(text, match, replacement): def replace_match(match, replacement):
"""Replaces the regex match by the replacement in the text.""" """Replaces the regex match by the replacement in the text."""
return text[:match.start()] + replacement + text[match.end():] return match.string[:match.start()] + replacement + match.string[match.end():]
def replace_shortcode(text, shortcode): def replace_shortcode(shortcode):
"""Replaces the shortcode by a Markdown fallback in the text. """Replaces the shortcode by a Markdown fallback in the text.
The supported shortcodes are: The supported shortcodes are:
@ -82,32 +87,37 @@ def replace_shortcode(text, shortcode):
if shortcode['name'].startswith("/"): if shortcode['name'].startswith("/"):
# This is the end of the shortcode, just remove it. # This is the end of the shortcode, just remove it.
return replace_match(text, shortcode['match'], "") return replace_match(shortcode, "")
# Parse the parameters of the shortcode
params = {}
if shortcode['params']:
for param in shortcode_params_regex.finditer(shortcode['params']):
if param['key']:
params[param['key']] = param['value']
match shortcode['name']: match shortcode['name']:
case "boxes/note": case "boxes/note":
text = replace_match(text, shortcode['match'], "**NOTE:** ") return replace_match(shortcode, "**NOTE:** ")
case "boxes/rationale": case "boxes/rationale":
text = replace_match(text, shortcode['match'], "**RATIONALE:** ") return replace_match(shortcode, "**RATIONALE:** ")
case "boxes/warning": case "boxes/warning":
text = replace_match(text, shortcode['match'], "**WARNING:** ") return replace_match(shortcode, "**WARNING:** ")
case "added-in": case "added-in":
version = shortcode['params']['v'] version = params['v']
if not version: if not version:
raise ValueError("Missing parameter `v` for `added-in` shortcode") raise ValueError("Missing parameter `v` for `added-in` shortcode")
text = replace_match(text, shortcode['match'], f"**[Added in `v{version}`]** ") return replace_match(shortcode, f"**[Added in `v{version}`]** ")
case "changed-in": case "changed-in":
version = shortcode['params']['v'] version = params['v']
if not version: if not version:
raise ValueError("Missing parameter `v` for `changed-in` shortcode") raise ValueError("Missing parameter `v` for `changed-in` shortcode")
text = replace_match(text, shortcode['match'], f"**[Changed in `v{version}`]** ") return replace_match(shortcode, f"**[Changed in `v{version}`]** ")
case _: case _:
raise ValueError("Unknown shortcode", shortcode['name']) raise ValueError("Unknown shortcode", shortcode['name'])
return text
def find_and_replace_shortcodes(text): def find_and_replace_shortcodes(text):
"""Finds Hugo shortcodes and replaces them by a Markdown fallback. """Finds Hugo shortcodes and replaces them by a Markdown fallback.
@ -120,20 +130,8 @@ def find_and_replace_shortcodes(text):
# We use a `while` loop with `search` instead of a `for` loop with # We use a `while` loop with `search` instead of a `for` loop with
# `finditer`, because as soon as we start replacing text, the # `finditer`, because as soon as we start replacing text, the
# indices of the match are invalid. # indices of the match are invalid.
while match := shortcode_regex.search(text): while shortcode := shortcode_regex.search(text):
# Parse the parameters of the shortcode text = replace_shortcode(shortcode)
params = {}
if match['params']:
for param in shortcode_params_regex.finditer(match['params']):
if param['key']:
params[param['key']] = param['value']
shortcode = {
'name': match['name'],
'params': params,
'match': match,
}
text = replace_shortcode(text, shortcode)
return text return text
@ -143,7 +141,7 @@ def edit_descriptions(node, base_url):
The fixes that are applied are: The fixes that are applied are:
* Make links absolute * Make links absolute
* Replace shortcodes * Replace Hugo shortcodes
""" """
if isinstance(node, dict): if isinstance(node, dict):
for key in node: for key in node: