Mark Slee | 89e2bb8 | 2007-03-01 00:20:36 +0000 | [diff] [blame] | 1 | # |
David Reiss | ea2cba8 | 2009-03-30 21:35:00 +0000 | [diff] [blame] | 2 | # Licensed to the Apache Software Foundation (ASF) under one |
| 3 | # or more contributor license agreements. See the NOTICE file |
| 4 | # distributed with this work for additional information |
| 5 | # regarding copyright ownership. The ASF licenses this file |
| 6 | # to you under the Apache License, Version 2.0 (the |
| 7 | # "License"); you may not use this file except in compliance |
| 8 | # with the License. You may obtain a copy of the License at |
| 9 | # |
| 10 | # http://www.apache.org/licenses/LICENSE-2.0 |
| 11 | # |
| 12 | # Unless required by applicable law or agreed to in writing, |
| 13 | # software distributed under the License is distributed on an |
| 14 | # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| 15 | # KIND, either express or implied. See the License for the |
| 16 | # specific language governing permissions and limitations |
| 17 | # under the License. |
| 18 | # |
Mark Slee | 89e2bb8 | 2007-03-01 00:20:36 +0000 | [diff] [blame] | 19 | |
Nobuaki Sukegawa | 760511f | 2015-11-06 21:24:16 +0900 | [diff] [blame] | 20 | from io import BytesIO |
Roger Meier | 3f5a264 | 2012-04-13 14:20:08 +0000 | [diff] [blame] | 21 | import os |
James E. King III | 6f8c99e | 2018-03-24 16:32:02 -0400 | [diff] [blame] | 22 | import ssl |
Roger Meier | 3f5a264 | 2012-04-13 14:20:08 +0000 | [diff] [blame] | 23 | import sys |
Bryan Duxbury | 6972041 | 2012-01-03 17:32:30 +0000 | [diff] [blame] | 24 | import warnings |
Martin Wilck | 1ac0a80 | 2016-04-27 09:41:03 +0200 | [diff] [blame] | 25 | import base64 |
Bryan Duxbury | 6972041 | 2012-01-03 17:32:30 +0000 | [diff] [blame] | 26 | |
Nobuaki Sukegawa | 760511f | 2015-11-06 21:24:16 +0900 | [diff] [blame] | 27 | from six.moves import urllib |
| 28 | from six.moves import http_client |
Mark Slee | bd8b991 | 2007-02-27 20:17:00 +0000 | [diff] [blame] | 29 | |
Nobuaki Sukegawa | 10308cb | 2016-02-03 01:57:03 +0900 | [diff] [blame] | 30 | from .TTransport import TTransportBase |
Nobuaki Sukegawa | 760511f | 2015-11-06 21:24:16 +0900 | [diff] [blame] | 31 | import six |
Bryan Duxbury | 6972041 | 2012-01-03 17:32:30 +0000 | [diff] [blame] | 32 | |
Mark Slee | bd8b991 | 2007-02-27 20:17:00 +0000 | [diff] [blame] | 33 | |
class THttpClient(TTransportBase):
    """Http implementation of TTransport base.

    Bytes passed to write() are buffered in memory. flush() sends the
    buffered bytes as the body of one HTTP POST request and keeps the
    response object so that read() can consume the reply.
    """

    def __init__(self, uri_or_host, port=None, path=None, cafile=None,
                 cert_file=None, key_file=None, ssl_context=None):
        """THttpClient supports two different types of construction:

        THttpClient(host, port, path) - deprecated
        THttpClient(uri, [port=<n>, path=<s>, cafile=<filename>,
                    cert_file=<filename>, key_file=<filename>,
                    ssl_context=<context>])

        Only the second supports https. To properly authenticate against the
        server, provide the client's identity by specifying cert_file and
        key_file. To properly authenticate the server, specify either cafile
        or ssl_context with a CA defined.
        NOTE: if both cafile and ssl_context are defined, ssl_context will
        override cafile.

        Proxy settings are taken from urllib.request.getproxies() for the
        selected scheme, unless urllib.request.proxy_bypass() matches the
        target host.
        """
        # Always define the TLS attributes so they exist whatever the scheme;
        # they are only given real values for https URIs below.
        self.certfile = None
        self.keyfile = None
        self.context = None

        if port is not None:
            warnings.warn(
                "Please use the THttpClient('http{s}://host:port/path') constructor",
                DeprecationWarning,
                stacklevel=2)
            self.host = uri_or_host
            self.port = port
            assert path
            self.path = path
            self.scheme = 'http'
        else:
            parsed = urllib.parse.urlparse(uri_or_host)
            self.scheme = parsed.scheme
            assert self.scheme in ('http', 'https')
            if self.scheme == 'http':
                self.port = parsed.port or http_client.HTTP_PORT
            elif self.scheme == 'https':
                self.port = parsed.port or http_client.HTTPS_PORT
                self.certfile = cert_file
                self.keyfile = key_file
                # An explicit ssl_context wins over cafile.
                if cafile and not ssl_context:
                    self.context = ssl.create_default_context(cafile=cafile)
                else:
                    self.context = ssl_context
            self.host = parsed.hostname
            self.path = parsed.path
            if parsed.query:
                self.path += '?%s' % parsed.query

        try:
            proxy = urllib.request.getproxies()[self.scheme]
        except KeyError:
            proxy = None
        else:
            if urllib.request.proxy_bypass(self.host):
                proxy = None

        if proxy:
            # Connect to the proxy; remember the real target separately.
            parsed = urllib.parse.urlparse(proxy)
            self.realhost = self.host
            self.realport = self.port
            self.host = parsed.hostname
            self.port = parsed.port
            self.proxy_auth = self.basic_proxy_auth_header(parsed)
        else:
            self.realhost = self.realport = self.proxy_auth = None

        self.__wbuf = BytesIO()
        self.__http = None
        self.__http_response = None
        self.__timeout = None
        self.__custom_headers = None
        # Headers of the most recent response (set by flush()).
        self.headers = None

    @staticmethod
    def basic_proxy_auth_header(proxy):
        """Build a "Basic ..." Proxy-Authorization value from a parsed proxy URL.

        proxy is the result of urllib.parse.urlparse() on the proxy URL, or
        None. Returns None when there is no proxy or it carries no username;
        otherwise returns the header value as a text string. A missing
        password is treated as an empty password.
        """
        if proxy is None or not proxy.username:
            return None
        username = urllib.parse.unquote(proxy.username)
        # proxy.password is None for URLs such as http://user@host:port
        password = urllib.parse.unquote(proxy.password or '')
        credentials = "%s:%s" % (username, password)
        token = base64.b64encode(credentials.encode()).strip()
        # b64encode returns bytes on Python 3; it must be text before it can
        # be concatenated with the "Basic " prefix.
        if not isinstance(token, str):
            token = token.decode('ascii')
        return "Basic " + token

    def using_proxy(self):
        """Return True when requests are routed through a proxy."""
        return self.realhost is not None

    def open(self):
        """Create the underlying HTTP(S) connection object.

        For https, a client certificate (cert_file/key_file given to the
        constructor) is loaded into the SSL context, and when a proxy is in
        use a CONNECT tunnel to the real host is configured.
        """
        if self.scheme == 'http':
            self.__http = http_client.HTTPConnection(self.host, self.port,
                                                     timeout=self.__timeout)
        elif self.scheme == 'https':
            context = self.context
            if self.certfile or self.keyfile:
                # HTTPSConnection no longer accepts key_file/cert_file on
                # recent Python versions, so load the client identity into
                # the context directly (which is what those arguments did).
                if context is None:
                    context = ssl.create_default_context()
                context.load_cert_chain(self.certfile, self.keyfile)
                # Supplying a client certificate means the caller wants to
                # authenticate; allow TLS 1.3 post-handshake auth if the
                # running ssl module supports it.
                if getattr(context, 'post_handshake_auth', None) is not None:
                    context.post_handshake_auth = True
            self.__http = http_client.HTTPSConnection(self.host, self.port,
                                                      timeout=self.__timeout,
                                                      context=context)
            if self.using_proxy():
                # Only send Proxy-Authorization when credentials exist;
                # otherwise the literal value "None" would be transmitted.
                tunnel_headers = {}
                if self.proxy_auth is not None:
                    tunnel_headers["Proxy-Authorization"] = self.proxy_auth
                self.__http.set_tunnel(self.realhost, self.realport,
                                       tunnel_headers)

    def close(self):
        """Close the connection, if any, and drop the pending response."""
        if self.__http is not None:
            self.__http.close()
        self.__http = None
        self.__http_response = None

    def isOpen(self):
        """Return True when a connection object currently exists."""
        return self.__http is not None

    def setTimeout(self, ms):
        """Set the connection timeout in milliseconds (None disables it).

        The value is used the next time open() creates a connection.
        """
        if ms is None:
            self.__timeout = None
        else:
            self.__timeout = ms / 1000.0

    def setCustomHeaders(self, headers):
        """Set a mapping of extra headers to send with every request."""
        self.__custom_headers = headers

    def read(self, sz):
        """Read up to sz bytes from the response of the last flush()."""
        return self.__http_response.read(sz)

    def write(self, buf):
        """Append buf to the in-memory request buffer."""
        self.__wbuf.write(buf)

    def flush(self):
        """Send the buffered bytes as one HTTP POST and fetch the response.

        A fresh connection is opened for each call. Afterwards self.code,
        self.message and self.headers hold the status, reason and headers
        of the response, and read() returns its body.
        """
        if self.isOpen():
            self.close()
        self.open()

        # Pull data out of buffer
        data = self.__wbuf.getvalue()
        self.__wbuf = BytesIO()

        # HTTP request
        plain_http_proxy = self.using_proxy() and self.scheme == "http"
        if plain_http_proxy:
            # need full URL of real host for HTTP proxy here (HTTPS uses CONNECT tunnel)
            self.__http.putrequest('POST', "http://%s:%s%s" %
                                   (self.realhost, self.realport, self.path))
        else:
            self.__http.putrequest('POST', self.path)

        # Write headers
        self.__http.putheader('Content-Type', 'application/x-thrift')
        self.__http.putheader('Content-Length', str(len(data)))
        if plain_http_proxy and self.proxy_auth is not None:
            self.__http.putheader("Proxy-Authorization", self.proxy_auth)

        if not self.__custom_headers or 'User-Agent' not in self.__custom_headers:
            user_agent = 'Python/THttpClient'
            # sys.argv can be empty or missing in embedded interpreters.
            argv = getattr(sys, 'argv', None)
            script = os.path.basename(argv[0]) if argv else ''
            if script:
                user_agent = '%s (%s)' % (user_agent, urllib.parse.quote(script))
            self.__http.putheader('User-Agent', user_agent)

        if self.__custom_headers:
            for key, val in six.iteritems(self.__custom_headers):
                self.__http.putheader(key, val)

        # Send back the cookie received in the previous response.
        # HTTPConnection.putheader can only be called after a request has been
        # started, and before it's been sent.
        if self.headers and 'Set-Cookie' in self.headers:
            self.__http.putheader('Cookie', self.headers['Set-Cookie'])

        self.__http.endheaders()

        # Write payload
        self.__http.send(data)

        # Get reply to flush the request
        self.__http_response = self.__http.getresponse()
        self.code = self.__http_response.status
        self.message = self.__http_response.reason
        self.headers = self.__http_response.msg