]> git.mxchange.org Git - quix0rs-apt-p2p.git/blobdiff - HTTPDownloader.py
Make it also work from the command-line.
[quix0rs-apt-p2p.git] / HTTPDownloader.py
index 290c7f9a8a56f0a77e3bd27025d52912fc8a6da5..7e5a06cb6880a10bcb8ce0a20c43ef56e1862ab9 100644 (file)
@@ -1,11 +1,16 @@
 
 from twisted.internet import reactor, defer, protocol
 from twisted.internet.protocol import ClientFactory
+from twisted import version as twisted_version
 from twisted.web2.client.interfaces import IHTTPClientManager
 from twisted.web2.client.http import ProtocolError, ClientRequest, HTTPClientProtocol
+from twisted.web2 import stream as stream_mod, http_headers
+from twisted.web2 import version as web2_version
 from twisted.trial import unittest
 from zope.interface import implements
 
+from apt_dht_conf import version
+
 class HTTPClientManager(ClientFactory):
     """A manager for all HTTP requests to a single site.
     
@@ -17,7 +22,7 @@ class HTTPClientManager(ClientFactory):
 
     implements(IHTTPClientManager)
     
-    def __init__(self, host, port):
+    def __init__(self, host, port=80):
         self.host = host
         self.port = port
         self.busy = False
@@ -104,23 +109,22 @@ class HTTPClientManager(ClientFactory):
         if self.request_queue:
             self.processQueue()
             
-class HTTPDownloader:
-    """Manages all the HTTP connections to various sites."""
+    def setCommonHeaders(self):
+        headers = http_headers.Headers()
+        headers.setHeader('Host', self.host)
+        headers.setHeader('User-Agent', 'apt-dht/%s (twisted/%s twisted.web2/%s)' % 
+                          (version.short(), twisted_version.short(), web2_version.short()))
+        return headers
     
-    def __init__(self):
-        self.clients = {}
+    def get(self, path, method="GET"):
+        headers = self.setCommonHeaders()
+        return self.submitRequest(ClientRequest(method, path, headers, None))
     
-    def get(self, host, port, request):
-        site = host + ":" + str(port)
-        if site not in self.clients:
-            self.clients[site] = HTTPClientManager(host, port)
-        return self.clients[site].submitRequest(request)
+    def getRange(self, path, rangeStart, rangeEnd, method="GET"):
+        headers = self.setCommonHeaders()
+        headers.setHeader('Range', ('bytes', [(rangeStart, rangeEnd)]))
+        return self.submitRequest(ClientRequest(method, path, headers, None))
     
-    def closeAll(self):
-        for site in self.clients:
-            self.clients[site].close()
-        self.clients = {}
-
 class TestClientManager(unittest.TestCase):
     """Unit tests for the HTTPClientManager."""
     
@@ -129,30 +133,31 @@ class TestClientManager(unittest.TestCase):
     
     def gotResp(self, resp, num, expect):
         self.failUnless(resp.code >= 200 and resp.code < 300, "Got a non-200 response: %r" % resp.code)
-        self.failUnless(resp.stream.length == expect, "Length was incorrect, got %r, expected %r" % (resp.stream.length, expect))
-        resp.stream.close()
+        if expect is not None:
+            self.failUnless(resp.stream.length == expect, "Length was incorrect, got %r, expected %r" % (resp.stream.length, expect))
+        def print_(n):
+            pass
+        def printdone(n):
+            pass
+        stream_mod.readStream(resp.stream, print_).addCallback(printdone)
     
     def test_download(self):
         host = 'www.camrdale.org'
         self.client = HTTPClientManager(host, 80)
         self.timeout = 10
-        lastDefer = defer.Deferred()
         
-        d = self.client.submitRequest(ClientRequest("GET", '/robots.txt', {'Host':host}, None))
+        d = self.client.get('/robots.txt')
         d.addCallback(self.gotResp, 1, 309)
-        d.addBoth(lastDefer.callback)
-        return lastDefer
+        return d
         
     def test_head(self):
         host = 'www.camrdale.org'
         self.client = HTTPClientManager(host, 80)
         self.timeout = 10
-        lastDefer = defer.Deferred()
         
-        d = self.client.submitRequest(ClientRequest("HEAD", '/robots.txt', {'Host':host}, None))
+        d = self.client.get('/robots.txt', "HEAD")
         d.addCallback(self.gotResp, 1, 0)
-        d.addBoth(lastDefer.callback)
-        return lastDefer
+        return d
         
     def test_multiple_downloads(self):
         host = 'www.camrdale.org'
@@ -161,7 +166,7 @@ class TestClientManager(unittest.TestCase):
         lastDefer = defer.Deferred()
         
         def newRequest(path, num, expect, last=False):
-            d = self.client.submitRequest(ClientRequest("GET", path, {'Host':host}, None))
+            d = self.client.get(path)
             d.addCallback(self.gotResp, num, expect)
             if last:
                 d.addCallback(lastDefer.callback)
@@ -178,99 +183,44 @@ class TestClientManager(unittest.TestCase):
         self.pending_calls.append(reactor.callLater(62, newRequest, '/sitemap2.rss', 0, 302362, True))
         return lastDefer
         
-    def test_range(self):
+    def test_multiple_quick_downloads(self):
         host = 'www.camrdale.org'
         self.client = HTTPClientManager(host, 80)
-        self.timeout = 10
-        lastDefer = defer.Deferred()
-        
-        d = self.client.submitRequest(ClientRequest("GET", '/robots.txt', {'Host':host, 'Range': ('bytes', [(100, 199)])}, None))
-        d.addCallback(self.gotResp, 1, 100)
-        d.addBoth(lastDefer.callback)
-        return lastDefer
-        
-    def tearDown(self):
-        for p in self.pending_calls:
-            if p.active():
-                p.cancel()
-        self.pending_calls = []
-        if self.client:
-            self.client.close()
-            self.client = None
-
-class TestDownloader(unittest.TestCase):
-    """Unit tests for the HTTPDownloader."""
-    
-    manager = None
-    pending_calls = []
-    
-    def gotResp(self, resp, num, expect):
-        self.failUnless(resp.code >= 200 and resp.code < 300, "Got a non-200 response: %r" % resp.code)
-        if expect is not None:
-            self.failUnless(resp.stream.length == expect, "Length was incorrect, got %r, expected %r" % (resp.stream.length, expect))
-        resp.stream.close()
-    
-    def test_download(self):
-        self.manager = HTTPDownloader()
-        self.timeout = 10
-        lastDefer = defer.Deferred()
-        
-        host = 'www.camrdale.org'
-        d = self.manager.get(host, 80, ClientRequest("GET", '/robots.txt', {'Host':host}, None))
-        d.addCallback(self.gotResp, 1, 309)
-        d.addBoth(lastDefer.callback)
-        return lastDefer
-        
-    def test_head(self):
-        self.manager = HTTPDownloader()
-        self.timeout = 10
+        self.timeout = 30
         lastDefer = defer.Deferred()
         
-        host = 'www.camrdale.org'
-        d = self.manager.get(host, 80, ClientRequest("HEAD", '/robots.txt', {'Host':host}, None))
-        d.addCallback(self.gotResp, 1, 0)
-        d.addBoth(lastDefer.callback)
-        return lastDefer
-        
-    def test_multiple_downloads(self):
-        self.manager = HTTPDownloader()
-        self.timeout = 120
-        lastDefer = defer.Deferred()
-        
-        def newRequest(host, path, num, expect, last=False):
-            d = self.manager.get(host, 80, ClientRequest("GET", path, {'Host':host}, None))
+        def newRequest(path, num, expect, last=False):
+            d = self.client.get(path)
             d.addCallback(self.gotResp, num, expect)
             if last:
                 d.addCallback(lastDefer.callback)
                 
-        newRequest('www.camrdale.org', "/", 1, 3433)
-        newRequest('www.camrdale.org', "/blog/", 2, 37121)
-        newRequest('www.google.ca', "/", 3, None)
-        self.pending_calls.append(reactor.callLater(1, newRequest, 'www.sfu.ca', '/', 4, None))
-        self.pending_calls.append(reactor.callLater(10, newRequest, 'www.camrdale.org', '/wikilink.html', 5, 3084))
-        self.pending_calls.append(reactor.callLater(30, newRequest, 'www.camrdale.org', '/sitemap.html', 6, 4750))
-        self.pending_calls.append(reactor.callLater(31, newRequest, 'www.sfu.ca', '/studentcentral/index.html', 7, None))
-        self.pending_calls.append(reactor.callLater(32, newRequest, 'www.camrdale.org', '/openid.html', 8, 2525))
-        self.pending_calls.append(reactor.callLater(32, newRequest, 'www.camrdale.org', '/subpage.html', 9, 2381))
-        self.pending_calls.append(reactor.callLater(62, newRequest, 'www.google.ca', '/intl/en/options/', 0, None, True))
+        newRequest("/", 1, 3433)
+        newRequest("/blog/", 2, 37121)
+        newRequest("/camrdale.html", 3, 2234)
+        self.pending_calls.append(reactor.callLater(0, newRequest, '/robots.txt', 4, 309))
+        self.pending_calls.append(reactor.callLater(0, newRequest, '/wikilink.html', 5, 3084))
+        self.pending_calls.append(reactor.callLater(0, newRequest, '/sitemap.html', 6, 4750))
+        self.pending_calls.append(reactor.callLater(0, newRequest, '/PlanetLab.html', 7, 2783))
+        self.pending_calls.append(reactor.callLater(0, newRequest, '/openid.html', 8, 2525))
+        self.pending_calls.append(reactor.callLater(0, newRequest, '/subpage.html', 9, 2381))
+        self.pending_calls.append(reactor.callLater(0, newRequest, '/sitemap2.rss', 0, 302362, True))
         return lastDefer
         
     def test_range(self):
-        self.manager = HTTPDownloader()
+        host = 'www.camrdale.org'
+        self.client = HTTPClientManager(host, 80)
         self.timeout = 10
-        lastDefer = defer.Deferred()
         
-        host = 'www.camrdale.org'
-        d = self.manager.get(host, 80, ClientRequest("GET", '/robots.txt', {'Host':host, 'Range': ('bytes', [(100, 199)])}, None))
+        d = self.client.getRange('/robots.txt', 100, 199)
         d.addCallback(self.gotResp, 1, 100)
-        d.addBoth(lastDefer.callback)
-        return lastDefer
+        return d
         
     def tearDown(self):
         for p in self.pending_calls:
             if p.active():
                 p.cancel()
         self.pending_calls = []
-        if self.manager:
-            self.manager.closeAll()
-            self.manager = None
+        if self.client:
+            self.client.close()
+            self.client = None