Normalize before removing wrong letters

2025-06-29 10:30:55 +02:00 · 2020-10-02 16:59:58 +02:00
parent 8fa724e848
commit 3edc3ffa02
1 changed file with 1 addition and 1 deletion
--- a/media/forms.py
+++ b/media/forms.py
@@ -31,7 +31,6 @@ def generate_side_identifier(title, authors, subtitle=None):
    title_normalized = re.sub(r'^THE ', '', title_normalized)
    title_normalized = re.sub(r'Œ', 'OE', title_normalized)
    title_normalized = title_normalized.replace(' ', '')
-    title_normalized = re.sub("[^A-Z0-9$]", "", title_normalized)
    title_normalized = ''.join(
        char
        for char in unicodedata.normalize(
@@ -39,6 +38,7 @@ def generate_side_identifier(title, authors, subtitle=None):
        if all(not unicodedata.category(char).startswith(cat)
               for cat in {'M', 'P', 'Z', 'C'}) or char == ' '
    ).casefold().upper()
+    title_normalized = re.sub("[^A-Z0-9$]", "", title_normalized)
    authors = authors.copy()

    def sort(author):