Add Unicode NFKC normalization of paths. Somebody just tried to access /wg/ipfix/charter/ with 'fi' composed as a ligature \ufb01...

- Legacy-Id: 2253
This commit is contained in:
Henrik Levkowetz 2010-05-11 10:11:24 +00:00
parent 0573415958
commit 8f74caf7d2
2 changed files with 20 additions and 0 deletions

View file

@ -9,6 +9,7 @@ import re
import smtplib
import sys
import traceback
import unicodedata
class SQLLogMiddleware(object):
def process_response(self, request, response):
@ -39,3 +40,21 @@ class RedirectTrailingPeriod(object):
if response.status_code == 404 and request.path.endswith("."):
return HttpResponsePermanentRedirect(request.path.rstrip("."))
return response
class UnicodeNfkcNormalization(object):
def process_request(self, request):
"""Do Unicode NFKC normalization to turn ligatures into individual characters.
This was prompted by somebody actually requesting an url for /wg/ipfix/charter
where the 'fi' was composed of an \ufb01 ligature...
There are probably other elements of a request which may need this normalization
too, but let's put that in as it comes up, rather than guess ahead.
"""
if request.META["PATH_INFO"].startswith("/wg/"):
print "-------->>"
request.META["PATH_INFO"] = unicodedata.normalize('NFKC', request.META["PATH_INFO"])
request.path_info = unicodedata.normalize('NFKC', request.path_info)
print repr(request)
print "--------<<"
return None

View file

@ -91,6 +91,7 @@ MIDDLEWARE_CLASSES = (
'ietf.middleware.SMTPExceptionMiddleware',
'ietf.middleware.RedirectTrailingPeriod',
'django.middleware.transaction.TransactionMiddleware',
'ietf.middleware.UnicodeNfkcNormalization',
)
ROOT_URLCONF = 'ietf.urls'