matthewdeanmartin · November 13, 2025 13:43
diff --git a/folding.py b/folding.py
 import re
 import unicodedata


 def strip_accents(s: str) -> str:
     """Return *s* with every nonspacing combining mark removed.

     The string is first put into NFD form, which splits a precomposed
     letter such as "ï" into its base letter "i" followed by the combining
     diaeresis. Every code point whose Unicode general category is "Mn"
     (Mark, nonspacing) is then discarded; everything else is kept in order.
     """
     decomposed = unicodedata.normalize("NFD", s)
     kept = []
     for ch in decomposed:
         if unicodedata.category(ch) == "Mn":
             # Combining accent: drop it, keep the base letter before it.
             continue
         kept.append(ch)
     return "".join(kept)


 def _fold_with_offsets(s: str):
     """Fold accents out of *s* and remember where each kept character came from.

     Returns a ``(folded, origin)`` pair: ``folded`` is *s* decomposed with NFD
     and stripped of category-"Mn" marks; ``origin[k]`` is the index in *s* of
     the character that produced ``folded[k]``.
     """
     folded = []
     origin = []
     for index, ch in enumerate(s):
         for piece in unicodedata.normalize("NFD", ch):
             if unicodedata.category(piece) != "Mn":
                 folded.append(piece)
                 origin.append(index)
     return "".join(folded), origin


 def findall_accent_insensitive(pattern: str, text: str):
     """Find all matches of *pattern* in *text*, ignoring accents on both sides.

     Both arguments are accent-folded (NFD, nonspacing marks dropped) and the
     folded pattern is compiled as a regular expression and run over the
     folded text. Each match is reported as the corresponding slice of the
     ORIGINAL *text*, accents included.

     Match positions refer to the folded text, which is not guaranteed to have
     the same length as *text* (already-decomposed input is shorter once its
     marks are dropped; characters that expand under NFD make it longer).
     Positions are therefore translated back through an offset map instead of
     being used to slice *text* directly.

     Args:
         pattern: Regular expression source; accents in it are ignored.
         text: The string to search.

     Returns:
         A list of substrings of *text*, one per non-overlapping match, in
         order of occurrence. Empty matches yield empty strings.

     Raises:
         re.error: If the folded pattern is not a valid regular expression.
     """
     norm_text, origin = _fold_with_offsets(text)
     norm_pattern, _ = _fold_with_offsets(pattern)

     regex = re.compile(norm_pattern)
     found = []
     for m in regex.finditer(norm_text):
         lo, hi = m.span()
         if lo == hi:
             # Zero-width match: there is no original character to report.
             found.append("")
             continue
         begin = origin[lo]
         end = origin[hi - 1] + 1
         # Combining marks that follow the last matched character belong to
         # it (decomposed input), so keep them in the reported slice.
         while end < len(text) and unicodedata.category(text[end]) == "Mn":
             end += 1
         found.append(text[begin:end])
     return found


 # Demo: the search pattern carries no accent, yet the reported match keeps
 # the accent found in the original text.
 txt = "j'ai croisé raïssa hier"
 print(findall_accent_insensitive(pattern="rai", text=txt))
 # -> ['raï']

 # ref: https://elk.zone/mastodon.social/@[email protected]/115541819305981530
	import re
	import unicodedata


	def strip_accents(s: str) -> str:
	    """Return *s* with every nonspacing combining mark removed.

	    NFD decomposes a precomposed letter such as "ï" into "i" plus the
	    combining diaeresis; all code points in Unicode category "Mn"
	    (Mark, nonspacing) are then dropped.
	    """
	    return "".join(
	        c for c in unicodedata.normalize("NFD", s)
	        if unicodedata.category(c) != "Mn"
	    )


	def _fold_with_offsets(s: str):
	    """Fold accents out of *s* and remember where each kept character came from.

	    Returns a ``(folded, origin)`` pair: ``folded`` is *s* decomposed with NFD
	    and stripped of category-"Mn" marks; ``origin[k]`` is the index in *s* of
	    the character that produced ``folded[k]``.
	    """
	    folded = []
	    origin = []
	    for index, ch in enumerate(s):
	        for piece in unicodedata.normalize("NFD", ch):
	            if unicodedata.category(piece) != "Mn":
	                folded.append(piece)
	                origin.append(index)
	    return "".join(folded), origin


	def findall_accent_insensitive(pattern: str, text: str):
	    """Find all matches of *pattern* in *text*, ignoring accents on both sides.

	    Both arguments are accent-folded (NFD, nonspacing marks dropped) and the
	    folded pattern is compiled as a regular expression and run over the
	    folded text. Each match is reported as the corresponding slice of the
	    ORIGINAL *text*, accents included.

	    Match positions refer to the folded text, which is not guaranteed to have
	    the same length as *text*, so they are translated back through an offset
	    map instead of being used to slice *text* directly.

	    Args:
	        pattern: Regular expression source; accents in it are ignored.
	        text: The string to search.

	    Returns:
	        A list of substrings of *text*, one per non-overlapping match, in
	        order of occurrence. Empty matches yield empty strings.

	    Raises:
	        re.error: If the folded pattern is not a valid regular expression.
	    """
	    norm_text, origin = _fold_with_offsets(text)
	    norm_pattern, _ = _fold_with_offsets(pattern)

	    regex = re.compile(norm_pattern)
	    found = []
	    for m in regex.finditer(norm_text):
	        lo, hi = m.span()
	        if lo == hi:
	            # Zero-width match: there is no original character to report.
	            found.append("")
	            continue
	        begin = origin[lo]
	        end = origin[hi - 1] + 1
	        # Combining marks that follow the last matched character belong to
	        # it (decomposed input), so keep them in the reported slice.
	        while end < len(text) and unicodedata.category(text[end]) == "Mn":
	            end += 1
	        found.append(text[begin:end])
	    return found


	# Demo: the search pattern carries no accent, yet the reported match keeps
	# the accent found in the original text.
	txt = "j'ai croisé raïssa hier"
	print(findall_accent_insensitive(pattern="rai", text=txt))
	# -> ['raï']

	# ref: https://elk.zone/mastodon.social/@[email protected]/115541819305981530
No results found