summaryrefslogtreecommitdiff
path: root/django/middleware/common.py
diff options
context:
space:
mode:
authorAymeric Augustin <aymeric.augustin@m4x.org>2015-11-26 21:27:12 +0100
committerAymeric Augustin <aymeric.augustin@m4x.org>2015-11-26 21:27:12 +0100
commit11f10b70f3cb21c7a7f859e417adee104758221b (patch)
treee7f90018003749eb446eb276ebc98ba7dd95b116 /django/middleware/common.py
parentcc2ca9c550fbf8fca8684b373a3c8e3618eea08e (diff)
Fixed #25302 (again) -- Ignored scheme when checking for bad referers.
The check introduced in 4ce433e was too strict in real life. The poorly implemented bots this patch attempted to ignore are sloppy when it comes to http vs. https.
Diffstat (limited to 'django/middleware/common.py')
-rw-r--r--django/middleware/common.py17
1 files changed, 11 insertions, 6 deletions
diff --git a/django/middleware/common.py b/django/middleware/common.py
index fa38c63a24..5aeb746f81 100644
--- a/django/middleware/common.py
+++ b/django/middleware/common.py
@@ -8,6 +8,7 @@ from django.core.exceptions import PermissionDenied
from django.core.mail import mail_managers
from django.utils.cache import get_conditional_response, set_response_etag
from django.utils.encoding import force_text
+from django.utils.six.moves.urllib.parse import urlparse
logger = logging.getLogger('django.request')
@@ -163,13 +164,17 @@ class BrokenLinkEmailsMiddleware(object):
according to project settings or in three specific situations:
- If the referer is empty.
- If a '?' in referer is identified as a search engine source.
- - If the referer is equal to the current URL (assumed to be a
- malicious bot).
+ - If the referer is equal to the current URL, ignoring the scheme
+ (assumed to be a poorly implemented bot).
"""
- full_url = "%s://%s/%s" % (request.scheme, domain, uri.lstrip('/'))
- if (not referer or
- (not self.is_internal_request(domain, referer) and '?' in referer) or
- (referer == uri or referer == full_url)):
+ if not referer:
+ return True
+
+ if not self.is_internal_request(domain, referer) and '?' in referer:
+ return True
+
+ parsed_referer = urlparse(referer)
+ if parsed_referer.netloc in ['', domain] and parsed_referer.path == uri:
return True
return any(pattern.search(uri) for pattern in settings.IGNORABLE_404_URLS)