[Author Prev][Author Next][Thread Prev][Thread Next][Author Index][Thread Index]
[or-cvs] [torflow/master 34/92] HTTP 3xx redirect handling
Author: John M. Schanck <john@xxxxxxxxxxx>
Date: Tue, 27 Jul 2010 12:32:55 -0400
Subject: HTTP 3xx redirect handling
Commit: c5765a46ff52f2cbaa79b4a2e0dee99d042f9baa
Added new inconclusive and failure cases for redirects. Non-tor
redirects return an inconclusive test result and an attempt to add the
redirect location to the target list. Previously when the HTTP test
requested a binary file that redirected to a dynamic html page, the
binary file's url would be marked as FailureDynamic. Now it'll be
marked as InconclusiveRedirect. Tor only redirects result in
FailureRedirect.
---
NetworkScanners/ExitAuthority/libsoat.py | 22 +++++++++--
NetworkScanners/ExitAuthority/soat.py | 60 ++++++++++++++++++++++++-----
2 files changed, 67 insertions(+), 15 deletions(-)
diff --git a/NetworkScanners/ExitAuthority/libsoat.py b/NetworkScanners/ExitAuthority/libsoat.py
index 69cec3c..f5916a9 100644
--- a/NetworkScanners/ExitAuthority/libsoat.py
+++ b/NetworkScanners/ExitAuthority/libsoat.py
@@ -45,18 +45,18 @@ __all__ = [ # Classes
"TEST_SUCCESS", "TEST_INCONCLUSIVE", "TEST_FAILURE",
"RESULT_STRINGS", "RESULT_CODES",
"INCONCLUSIVE_NOLOCALCONTENT", "INCONCLUSIVE_DYNAMICSSL",
- "INCONCLUSIVE_TORBREAKAGE", "INCONCLUSIVE_NOEXIT",
+ "INCONCLUSIVE_TORBREAKAGE", "INCONCLUSIVE_NOEXIT", "INCONCLUSIVE_REDIRECT",
"FAILURE_EXITONLY", "FAILURE_DYNAMIC", "FAILURE_COOKIEMISMATCH", "FAILURE_BADHTTPCODE",
"FAILURE_NOEXITCONTENT", "FAILURE_EXITTRUNCATION", "FAILURE_SOCKSERROR",
- "FAILURE_HOSTUNREACH", "FAILURE_NETUNREACH", "FAILURE_EXITPOLICY",
- "FAILURE_CONNREFUSED", "FAILURE_CONNERROR", "FAILURE_URLERROR", "FAILURE_CRYPTOERROR",
+ "FAILURE_HOSTUNREACH", "FAILURE_NETUNREACH", "FAILURE_EXITPOLICY", "FAILURE_CONNREFUSED",
+ "FAILURE_CONNERROR", "FAILURE_URLERROR", "FAILURE_REDIRECT", "FAILURE_CRYPTOERROR",
"FAILURE_TIMEOUT", "FAILURE_SLOWXFER", "FAILURE_HEADERCHANGE", "FAILURE_MISCEXCEPTION",
"FALSEPOSITIVE_HTTPERRORS", "FALSEPOSITIVE_DYNAMIC", "FALSEPOSITIVE_DYNAMIC_TOR",
"FALSEPOSITIVE_DEADSITE",
"E_SOCKS", "E_POLICY", "E_NETUNREACH", "E_HOSTUNREACH", "E_REFUSED",
"E_TIMEOUT", "E_SLOWXFER", "E_NOCONTENT", "E_CRYPTO", "E_URL", "E_MISC",
# Exception classes
- "SlowXferException",
+ "SlowXferException", "RedirectException", "NoURLsFound",
]
@@ -90,6 +90,7 @@ INCONCLUSIVE_NOLOCALCONTENT = "InconclusiveNoLocalContent"
INCONCLUSIVE_DYNAMICSSL = "InconclusiveDynamicSSL"
INCONCLUSIVE_TORBREAKAGE = "InconclusiveTorBreakage"
INCONCLUSIVE_NOEXIT = "InconclusiveNoExit"
+INCONCLUSIVE_REDIRECT = "InconclusiveRedirect"
# Failed reasons
FAILURE_EXITONLY = "FailureExitOnly"
@@ -105,6 +106,7 @@ FAILURE_EXITPOLICY = "FailureExitPolicy"
FAILURE_CONNREFUSED = "FailureConnRefused"
FAILURE_CONNERROR = "FailureConnError"
FAILURE_URLERROR = "FailureURLError"
+FAILURE_REDIRECT = "FailureRedirect"
FAILURE_CRYPTOERROR = "FailureCryptoError"
FAILURE_TIMEOUT = "FailureTimeout"
FAILURE_SLOWXFER = "FailureSlowXfer"
@@ -1145,3 +1147,15 @@ class JSSoupDiffer(JSDiffer):
class SlowXferException(Exception):
pass
+
+class RedirectException(Exception):
+ def __init__(self, code, orig, new):
+ self.code = code
+ self.orig_url = orig
+ self.new_url = new
+
+ def __str__(self):
+ return "HTTP %d Redirect: %s --> %s" % (self.code, self.orig_url, self.new_url)
+
+class NoURLsFound(Exception):
+ pass
diff --git a/NetworkScanners/ExitAuthority/soat.py b/NetworkScanners/ExitAuthority/soat.py
index 585bf1a..2eaf00c 100755
--- a/NetworkScanners/ExitAuthority/soat.py
+++ b/NetworkScanners/ExitAuthority/soat.py
@@ -174,6 +174,17 @@ class NoDNSHTTPHandler(urllib2.HTTPHandler):
def http_open(self, req):
return self.do_open(NoDNSHTTPConnection, req)
+class NullRedirectHandler(urllib2.HTTPRedirectHandler):
+ def http_error_301(self, req, fp, code, msg, headers):
+ if 'location' in headers:
+ newurl = headers.getheaders('location')[0]
+ elif 'uri' in headers:
+ newurl = headers.getheaders('uri')[0]
+ else:
+ return # pass through to http_error_default
+ raise RedirectException(code, req.get_full_url(), newurl)
+ http_error_302 = http_error_303 = http_error_307 = http_error_301
+
class ExitScanHandler(ScanSupport.ScanHandler):
def __init__(self, c, selmgr, strm_selector):
ScanSupport.ScanHandler.__init__(self, c, selmgr,
@@ -310,13 +321,14 @@ def http_request(address, cookie_jar=None, headers=firefox_headers):
try:
plog("DEBUG", "Starting request for: "+address)
if cookie_jar != None:
- opener = urllib2.build_opener(NoDNSHTTPHandler, urllib2.HTTPCookieProcessor(cookie_jar))
+ opener = urllib2.build_opener(NoDNSHTTPHandler, NullRedirectHandler, urllib2.HTTPCookieProcessor(cookie_jar))
reply = opener.open(request)
if "__filename" in cookie_jar.__dict__:
cookie_jar.save(cookie_jar.__filename, ignore_discard=True)
new_cookies = cookie_jar.make_cookies(reply, request)
else:
- reply = urllib2.urlopen(request)
+ opener = urllib2.build_opener(NoDNSHTTPHandler, NullRedirectHandler)
+ reply = opener.open(request)
length = reply.info().get("Content-Length")
if length and int(length) > max_content_size:
@@ -333,6 +345,8 @@ def http_request(address, cookie_jar=None, headers=firefox_headers):
rval = (E_TIMEOUT, None, [], "", e.__class__.__name__+str(e))
except SlowXferException, e:
rval = (E_SLOWXFER, None, [], "", e.__class__.__name__+str(e))
+ except RedirectException, e:
+ rval = (e.code, None, [], "", e.new_url)
except httplib.BadStatusLine, e:
plog('NOTICE', "HTTP Error during request of "+address+": "+str(e))
if not e.line:
@@ -523,6 +537,9 @@ class Test:
return False
return True
+ def add_target(self, target):
+ self.targets.append(target)
+
def remove_target(self, target, reason="None"):
self.banned_targets.add(target)
self.refill_targets()
@@ -971,6 +988,14 @@ class BaseHTTPTest(Test):
except IOError:
(code, resp_headers, new_cookies, mime_type, content) = http_request(address, self.cookie_jar, self.headers)
+ if code - (code % 100) == 300: # Redirection
+ plog("NOTICE", "Non-Tor HTTP "+str(code)+" redirect from "+str(address)+" to "+str(content))
+ self.remove_target(address, INCONCLUSIVE_REDIRECT)
+ self.add_target(content)
+ self.cookie_jar = orig_cookie_jar
+ self.tor_cookie_jar = orig_cookie_jar
+ return TEST_INCONCLUSIVE
+
if code - (code % 100) != 200:
plog("NOTICE", "Non-tor HTTP error "+str(code)+" fetching content for "+address)
# Just remove it
@@ -1046,10 +1071,17 @@ class BaseHTTPTest(Test):
BindingSocket.bind_to = None
if code_new == pcode:
- plog("NOTICE", "Non-tor HTTP error "+str(code_new)+" fetching content for "+address)
- # Just remove it
- self.remove_target(address, FALSEPOSITIVE_HTTPERRORS)
- return TEST_INCONCLUSIVE
+ if pcode - (pcode % 100) == 300:
+ plog("NOTICE", "Non-Tor HTTP "+str(code_new)+" redirect from "+address+" to "+str(content_new))
+ # Remove the original URL and add the redirect to our targets (if it's of the right type)
+ self.remove_target(address, INCONCLUSIVE_REDIRECT)
+ self.add_target(content)
+ return TEST_INCONCLUSIVE
+ else:
+ plog("NOTICE", "Non-tor HTTP error "+str(code_new)+" fetching content for "+address)
+ # Just remove it
+ self.remove_target(address, FALSEPOSITIVE_HTTPERRORS)
+ return TEST_INCONCLUSIVE
if pcode < 0 and type(pcode) == float:
if pcode == E_SOCKS: # "General socks error"
@@ -1091,6 +1123,14 @@ class BaseHTTPTest(Test):
fail_reason = FAILURE_URLERROR
else:
fail_reason = FAILURE_MISCEXCEPTION
+ elif pcode - (pcode % 100) == 300:
+ plog("NOTICE", "Tor only HTTP "+str(pcode)+" redirect from "+address+" to "+str(pcontent))
+ fail_reason = FAILURE_REDIRECT
+ result = HttpTestResult(self.node_map[exit_node[1:]],
+ address, TEST_FAILURE, fail_reason)
+ result.extra_info = str(pcontent)
+ self.register_exit_failure(result)
+ return TEST_FAILURE
else:
fail_reason = FAILURE_BADHTTPCODE+str(pcode)
result = HttpTestResult(self.node_map[exit_node[1:]],
@@ -1857,6 +1897,9 @@ class FixedTargetTest:
def __init__(self, targets):
self.fixed_targets = targets
+ def add_target(self, target):
+ pass
+
def refill_targets(self):
pass
@@ -2757,11 +2800,6 @@ def int2bin(n):
n = n >> 1
return bin[::-1]
-
-class NoURLsFound(Exception):
- pass
-
-
def cleanup(c, l, f):
plog("INFO", "Resetting __LeaveStreamsUnattached=0 and FetchUselessDescriptors="+f)
try:
--
1.7.1