Normalize Unicode in the sanitize function

feature-unify_handlers
Tomáš Mládek 2019-05-23 14:36:12 +02:00
parent 89db7e885a
commit 71a5fd3522
1 changed files with 3 additions and 0 deletions

View File

@@ -8,6 +8,7 @@ import re
import shutil
import sys
import tempfile
import unicodedata
from configparser import ConfigParser
from datetime import datetime, timedelta
from glob import glob
@@ -92,10 +93,12 @@ class DelojzaBot:
return True
return False
# https://github.com/django/django/blob/master/django/utils/text.py#L393
@staticmethod
def sanitize(filepath):
    """Return an ASCII-only, filesystem-friendly version of *filepath*.

    The text is NFKD-normalized so accented letters decompose into a base
    letter plus combining marks; everything that cannot be encoded as ASCII
    is then dropped. Finally, every character that is not a word character
    or one of ``. ( ) [ ] { } # -`` is replaced by an underscore (this
    includes whitespace and path separators).

    ``None`` is passed through unchanged.
    """
    if filepath is not None:
        decomposed = unicodedata.normalize('NFKD', filepath)
        # Encoding with 'ignore' silently discards the combining marks and
        # any other character that has no ASCII representation.
        ascii_only = decomposed.encode('ascii', 'ignore').decode('ascii')
        return re.sub(r'[^\w.()\[\]{}#-]', '_', ascii_only)
    return None
def tag_file(self, filepath, message, info=None):