1import errno 2import sys 3import re 4try: 5 import httplib 6except ImportError: # pragma: no cover 7 import http.client as httplib 8from webob.compat import url_quote 9import socket 10from webob import exc 11from webob.compat import PY3 12 13 14__all__ = ['send_request_app', 'SendRequest'] 15 16class SendRequest: 17 """ 18 Sends the request, as described by the environ, over actual HTTP. 19 All controls about how it is sent are contained in the request 20 environ itself. 21 22 This connects to the server given in SERVER_NAME:SERVER_PORT, and 23 sends the Host header in HTTP_HOST -- they do not have to match. 24 You can send requests to servers despite what DNS says. 25 26 Set ``environ['webob.client.timeout'] = 10`` to set the timeout on 27 the request (to, for example, 10 seconds). 28 29 Does not add X-Forwarded-For or other standard headers 30 31 If you use ``send_request_app`` then simple ``httplib`` 32 connections will be used. 33 """ 34 35 def __init__(self, HTTPConnection=httplib.HTTPConnection, 36 HTTPSConnection=httplib.HTTPSConnection): 37 self.HTTPConnection = HTTPConnection 38 self.HTTPSConnection = HTTPSConnection 39 40 def __call__(self, environ, start_response): 41 scheme = environ['wsgi.url_scheme'] 42 if scheme == 'http': 43 ConnClass = self.HTTPConnection 44 elif scheme == 'https': 45 ConnClass = self.HTTPSConnection 46 else: 47 raise ValueError( 48 "Unknown scheme: %r" % scheme) 49 if 'SERVER_NAME' not in environ: 50 host = environ.get('HTTP_HOST') 51 if not host: 52 raise ValueError( 53 "environ contains neither SERVER_NAME nor HTTP_HOST") 54 if ':' in host: 55 host, port = host.split(':', 1) 56 else: 57 if scheme == 'http': 58 port = '80' 59 else: 60 port = '443' 61 environ['SERVER_NAME'] = host 62 environ['SERVER_PORT'] = port 63 kw = {} 64 if ('webob.client.timeout' in environ and 65 self._timeout_supported(ConnClass) ): 66 kw['timeout'] = environ['webob.client.timeout'] 67 conn = ConnClass('%(SERVER_NAME)s:%(SERVER_PORT)s' % environ, **kw) 68 headers = {} 69 for key, value in environ.items(): 70 if key.startswith('HTTP_'): 71 key = key[5:].replace('_', '-').title() 72 headers[key] = value 73 path = (url_quote(environ.get('SCRIPT_NAME', '')) 74 + url_quote(environ.get('PATH_INFO', ''))) 75 if environ.get('QUERY_STRING'): 76 path += '?' + environ['QUERY_STRING'] 77 try: 78 content_length = int(environ.get('CONTENT_LENGTH', '0')) 79 except ValueError: 80 content_length = 0 81 ## FIXME: there is no streaming of the body, and that might be useful 82 ## in some cases 83 if content_length: 84 body = environ['wsgi.input'].read(content_length) 85 else: 86 body = '' 87 headers['Content-Length'] = content_length 88 if environ.get('CONTENT_TYPE'): 89 headers['Content-Type'] = environ['CONTENT_TYPE'] 90 if not path.startswith("/"): 91 path = "/" + path 92 try: 93 conn.request(environ['REQUEST_METHOD'], 94 path, body, headers) 95 res = conn.getresponse() 96 except socket.timeout: 97 resp = exc.HTTPGatewayTimeout() 98 return resp(environ, start_response) 99 except (socket.error, socket.gaierror) as e: 100 if ((isinstance(e, socket.error) and e.args[0] == -2) or 101 (isinstance(e, socket.gaierror) and e.args[0] == 8)): 102 # Name or service not known 103 resp = exc.HTTPBadGateway( 104 "Name or service not known (bad domain name: %s)" 105 % environ['SERVER_NAME']) 106 return resp(environ, start_response) 107 elif e.args[0] in _e_refused: # pragma: no cover 108 # Connection refused 109 resp = exc.HTTPBadGateway("Connection refused") 110 return resp(environ, start_response) 111 raise 112 headers_out = self.parse_headers(res.msg) 113 status = '%s %s' % (res.status, res.reason) 114 start_response(status, headers_out) 115 length = res.getheader('content-length') 116 # FIXME: This shouldn't really read in all the content at once 117 if length is not None: 118 body = res.read(int(length)) 119 else: 120 body = res.read() 121 conn.close() 122 return [body] 123 124 # Remove these headers from response (specify lower case header 125 # names): 126 filtered_headers = ( 127 'transfer-encoding', 128 ) 129 130 MULTILINE_RE = re.compile(r'\r?\n\s*') 131 132 def parse_headers(self, message): 133 """ 134 Turn a Message object into a list of WSGI-style headers. 135 """ 136 headers_out = [] 137 if PY3: # pragma: no cover 138 headers = message._headers 139 else: # pragma: no cover 140 headers = message.headers 141 for full_header in headers: 142 if not full_header: # pragma: no cover 143 # Shouldn't happen, but we'll just ignore 144 continue 145 if full_header[0].isspace(): # pragma: no cover 146 # Continuation line, add to the last header 147 if not headers_out: 148 raise ValueError( 149 "First header starts with a space (%r)" % full_header) 150 last_header, last_value = headers_out.pop() 151 value = last_value + ', ' + full_header.strip() 152 headers_out.append((last_header, value)) 153 continue 154 if isinstance(full_header, tuple): # pragma: no cover 155 header, value = full_header 156 else: # pragma: no cover 157 try: 158 header, value = full_header.split(':', 1) 159 except: 160 raise ValueError("Invalid header: %r" % (full_header,)) 161 value = value.strip() 162 if '\n' in value or '\r\n' in value: # pragma: no cover 163 # Python 3 has multiline values for continuations, Python 2 164 # has two items in headers 165 value = self.MULTILINE_RE.sub(', ', value) 166 if header.lower() not in self.filtered_headers: 167 headers_out.append((header, value)) 168 return headers_out 169 170 def _timeout_supported(self, ConnClass): 171 if sys.version_info < (2, 7) and ConnClass in ( 172 httplib.HTTPConnection, httplib.HTTPSConnection): # pragma: no cover 173 return False 174 return True 175 176 177send_request_app = SendRequest() 178 179_e_refused = (errno.ECONNREFUSED,) 180if hasattr(errno, 'ENODATA'): # pragma: no cover 181 _e_refused += (errno.ENODATA,) 182