pyopenssl.py 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509
  1. """
  2. TLS with SNI_-support for Python 2. Follow these instructions if you would
  3. like to verify TLS certificates in Python 2. Note, the default libraries do
  4. *not* do certificate checking; you need to do additional work to validate
  5. certificates yourself.
  6. This needs the following packages installed:
  7. * `pyOpenSSL`_ (tested with 16.0.0)
  8. * `cryptography`_ (minimum 1.3.4, from pyopenssl)
  9. * `idna`_ (minimum 2.0, from cryptography)
  10. However, pyopenssl depends on cryptography, which depends on idna, so while we
  11. use all three directly here we end up having relatively few packages required.
  12. You can install them with the following command:
  13. .. code-block:: bash
  14. $ python -m pip install pyopenssl cryptography idna
  15. To activate certificate checking, call
  16. :func:`~urllib3.contrib.pyopenssl.inject_into_urllib3` from your Python code
  17. before you begin making HTTP requests. This can be done in a ``sitecustomize``
  18. module, or at any other time before your application begins using ``urllib3``,
  19. like this:
  20. .. code-block:: python
  21. try:
  22. import urllib3.contrib.pyopenssl
  23. urllib3.contrib.pyopenssl.inject_into_urllib3()
  24. except ImportError:
  25. pass
  26. Now you can use :mod:`urllib3` as you normally would, and it will support SNI
  27. when the required modules are installed.
  28. Activating this module also has the positive side effect of disabling SSL/TLS
  29. compression in Python 2 (see `CRIME attack`_).
  30. .. _sni: https://en.wikipedia.org/wiki/Server_Name_Indication
  31. .. _crime attack: https://en.wikipedia.org/wiki/CRIME_(security_exploit)
  32. .. _pyopenssl: https://www.pyopenssl.org
  33. .. _cryptography: https://cryptography.io
  34. .. _idna: https://github.com/kjd/idna
  35. """
  36. from __future__ import absolute_import
  37. import OpenSSL.SSL
  38. from cryptography import x509
  39. from cryptography.hazmat.backends.openssl import backend as openssl_backend
  40. from cryptography.hazmat.backends.openssl.x509 import _Certificate
try:
    from cryptography.x509 import UnsupportedExtension
except ImportError:
    # UnsupportedExtension is gone in cryptography >= 2.1.0
    class UnsupportedExtension(Exception):
        # Stand-in type so that the ``except`` clause in get_subj_alt_name,
        # which names UnsupportedExtension, still resolves when the import
        # above fails.
        pass
  47. from io import BytesIO
  48. from socket import error as SocketError
  49. from socket import timeout
  50. try: # Platform-specific: Python 2
  51. from socket import _fileobject
  52. except ImportError: # Platform-specific: Python 3
  53. _fileobject = None
  54. from ..packages.backports.makefile import backport_makefile
  55. import logging
  56. import ssl
  57. import sys
  58. from .. import util
  59. from ..packages import six
  60. __all__ = ["inject_into_urllib3", "extract_from_urllib3"]
  61. # SNI always works.
  62. HAS_SNI = True
  63. # Map from urllib3 to PyOpenSSL compatible parameter-values.
  64. _openssl_versions = {
  65. util.PROTOCOL_TLS: OpenSSL.SSL.SSLv23_METHOD,
  66. ssl.PROTOCOL_TLSv1: OpenSSL.SSL.TLSv1_METHOD,
  67. }
  68. if hasattr(ssl, "PROTOCOL_SSLv3") and hasattr(OpenSSL.SSL, "SSLv3_METHOD"):
  69. _openssl_versions[ssl.PROTOCOL_SSLv3] = OpenSSL.SSL.SSLv3_METHOD
  70. if hasattr(ssl, "PROTOCOL_TLSv1_1") and hasattr(OpenSSL.SSL, "TLSv1_1_METHOD"):
  71. _openssl_versions[ssl.PROTOCOL_TLSv1_1] = OpenSSL.SSL.TLSv1_1_METHOD
  72. if hasattr(ssl, "PROTOCOL_TLSv1_2") and hasattr(OpenSSL.SSL, "TLSv1_2_METHOD"):
  73. _openssl_versions[ssl.PROTOCOL_TLSv1_2] = OpenSSL.SSL.TLSv1_2_METHOD
  74. _stdlib_to_openssl_verify = {
  75. ssl.CERT_NONE: OpenSSL.SSL.VERIFY_NONE,
  76. ssl.CERT_OPTIONAL: OpenSSL.SSL.VERIFY_PEER,
  77. ssl.CERT_REQUIRED: OpenSSL.SSL.VERIFY_PEER
  78. + OpenSSL.SSL.VERIFY_FAIL_IF_NO_PEER_CERT,
  79. }
  80. _openssl_to_stdlib_verify = dict((v, k) for k, v in _stdlib_to_openssl_verify.items())
  81. # OpenSSL will only write 16K at a time
  82. SSL_WRITE_BLOCKSIZE = 16384
  83. orig_util_HAS_SNI = util.HAS_SNI
  84. orig_util_SSLContext = util.ssl_.SSLContext
  85. log = logging.getLogger(__name__)
  86. def inject_into_urllib3():
  87. "Monkey-patch urllib3 with PyOpenSSL-backed SSL-support."
  88. _validate_dependencies_met()
  89. util.SSLContext = PyOpenSSLContext
  90. util.ssl_.SSLContext = PyOpenSSLContext
  91. util.HAS_SNI = HAS_SNI
  92. util.ssl_.HAS_SNI = HAS_SNI
  93. util.IS_PYOPENSSL = True
  94. util.ssl_.IS_PYOPENSSL = True
  95. def extract_from_urllib3():
  96. "Undo monkey-patching by :func:`inject_into_urllib3`."
  97. util.SSLContext = orig_util_SSLContext
  98. util.ssl_.SSLContext = orig_util_SSLContext
  99. util.HAS_SNI = orig_util_HAS_SNI
  100. util.ssl_.HAS_SNI = orig_util_HAS_SNI
  101. util.IS_PYOPENSSL = False
  102. util.ssl_.IS_PYOPENSSL = False
  103. def _validate_dependencies_met():
  104. """
  105. Verifies that PyOpenSSL's package-level dependencies have been met.
  106. Throws `ImportError` if they are not met.
  107. """
  108. # Method added in `cryptography==1.1`; not available in older versions
  109. from cryptography.x509.extensions import Extensions
  110. if getattr(Extensions, "get_extension_for_class", None) is None:
  111. raise ImportError(
  112. "'cryptography' module missing required functionality. "
  113. "Try upgrading to v1.3.4 or newer."
  114. )
  115. # pyOpenSSL 0.14 and above use cryptography for OpenSSL bindings. The _x509
  116. # attribute is only present on those versions.
  117. from OpenSSL.crypto import X509
  118. x509 = X509()
  119. if getattr(x509, "_x509", None) is None:
  120. raise ImportError(
  121. "'pyOpenSSL' module missing required functionality. "
  122. "Try upgrading to v0.14 or newer."
  123. )
  124. def _dnsname_to_stdlib(name):
  125. """
  126. Converts a dNSName SubjectAlternativeName field to the form used by the
  127. standard library on the given Python version.
  128. Cryptography produces a dNSName as a unicode string that was idna-decoded
  129. from ASCII bytes. We need to idna-encode that string to get it back, and
  130. then on Python 3 we also need to convert to unicode via UTF-8 (the stdlib
  131. uses PyUnicode_FromStringAndSize on it, which decodes via UTF-8).
  132. If the name cannot be idna-encoded then we return None signalling that
  133. the name given should be skipped.
  134. """
  135. def idna_encode(name):
  136. """
  137. Borrowed wholesale from the Python Cryptography Project. It turns out
  138. that we can't just safely call `idna.encode`: it can explode for
  139. wildcard names. This avoids that problem.
  140. """
  141. from pip._vendor import idna
  142. try:
  143. for prefix in [u"*.", u"."]:
  144. if name.startswith(prefix):
  145. name = name[len(prefix) :]
  146. return prefix.encode("ascii") + idna.encode(name)
  147. return idna.encode(name)
  148. except idna.core.IDNAError:
  149. return None
  150. # Don't send IPv6 addresses through the IDNA encoder.
  151. if ":" in name:
  152. return name
  153. name = idna_encode(name)
  154. if name is None:
  155. return None
  156. elif sys.version_info >= (3, 0):
  157. name = name.decode("utf-8")
  158. return name
  159. def get_subj_alt_name(peer_cert):
  160. """
  161. Given an PyOpenSSL certificate, provides all the subject alternative names.
  162. """
  163. # Pass the cert to cryptography, which has much better APIs for this.
  164. if hasattr(peer_cert, "to_cryptography"):
  165. cert = peer_cert.to_cryptography()
  166. else:
  167. # This is technically using private APIs, but should work across all
  168. # relevant versions before PyOpenSSL got a proper API for this.
  169. cert = _Certificate(openssl_backend, peer_cert._x509)
  170. # We want to find the SAN extension. Ask Cryptography to locate it (it's
  171. # faster than looping in Python)
  172. try:
  173. ext = cert.extensions.get_extension_for_class(x509.SubjectAlternativeName).value
  174. except x509.ExtensionNotFound:
  175. # No such extension, return the empty list.
  176. return []
  177. except (
  178. x509.DuplicateExtension,
  179. UnsupportedExtension,
  180. x509.UnsupportedGeneralNameType,
  181. UnicodeError,
  182. ) as e:
  183. # A problem has been found with the quality of the certificate. Assume
  184. # no SAN field is present.
  185. log.warning(
  186. "A problem was encountered with the certificate that prevented "
  187. "urllib3 from finding the SubjectAlternativeName field. This can "
  188. "affect certificate validation. The error was %s",
  189. e,
  190. )
  191. return []
  192. # We want to return dNSName and iPAddress fields. We need to cast the IPs
  193. # back to strings because the match_hostname function wants them as
  194. # strings.
  195. # Sadly the DNS names need to be idna encoded and then, on Python 3, UTF-8
  196. # decoded. This is pretty frustrating, but that's what the standard library
  197. # does with certificates, and so we need to attempt to do the same.
  198. # We also want to skip over names which cannot be idna encoded.
  199. names = [
  200. ("DNS", name)
  201. for name in map(_dnsname_to_stdlib, ext.get_values_for_type(x509.DNSName))
  202. if name is not None
  203. ]
  204. names.extend(
  205. ("IP Address", str(name)) for name in ext.get_values_for_type(x509.IPAddress)
  206. )
  207. return names
  208. class WrappedSocket(object):
  209. """API-compatibility wrapper for Python OpenSSL's Connection-class.
  210. Note: _makefile_refs, _drop() and _reuse() are needed for the garbage
  211. collector of pypy.
  212. """
  213. def __init__(self, connection, socket, suppress_ragged_eofs=True):
  214. self.connection = connection
  215. self.socket = socket
  216. self.suppress_ragged_eofs = suppress_ragged_eofs
  217. self._makefile_refs = 0
  218. self._closed = False
  219. def fileno(self):
  220. return self.socket.fileno()
  221. # Copy-pasted from Python 3.5 source code
  222. def _decref_socketios(self):
  223. if self._makefile_refs > 0:
  224. self._makefile_refs -= 1
  225. if self._closed:
  226. self.close()
  227. def recv(self, *args, **kwargs):
  228. try:
  229. data = self.connection.recv(*args, **kwargs)
  230. except OpenSSL.SSL.SysCallError as e:
  231. if self.suppress_ragged_eofs and e.args == (-1, "Unexpected EOF"):
  232. return b""
  233. else:
  234. raise SocketError(str(e))
  235. except OpenSSL.SSL.ZeroReturnError:
  236. if self.connection.get_shutdown() == OpenSSL.SSL.RECEIVED_SHUTDOWN:
  237. return b""
  238. else:
  239. raise
  240. except OpenSSL.SSL.WantReadError:
  241. if not util.wait_for_read(self.socket, self.socket.gettimeout()):
  242. raise timeout("The read operation timed out")
  243. else:
  244. return self.recv(*args, **kwargs)
  245. # TLS 1.3 post-handshake authentication
  246. except OpenSSL.SSL.Error as e:
  247. raise ssl.SSLError("read error: %r" % e)
  248. else:
  249. return data
  250. def recv_into(self, *args, **kwargs):
  251. try:
  252. return self.connection.recv_into(*args, **kwargs)
  253. except OpenSSL.SSL.SysCallError as e:
  254. if self.suppress_ragged_eofs and e.args == (-1, "Unexpected EOF"):
  255. return 0
  256. else:
  257. raise SocketError(str(e))
  258. except OpenSSL.SSL.ZeroReturnError:
  259. if self.connection.get_shutdown() == OpenSSL.SSL.RECEIVED_SHUTDOWN:
  260. return 0
  261. else:
  262. raise
  263. except OpenSSL.SSL.WantReadError:
  264. if not util.wait_for_read(self.socket, self.socket.gettimeout()):
  265. raise timeout("The read operation timed out")
  266. else:
  267. return self.recv_into(*args, **kwargs)
  268. # TLS 1.3 post-handshake authentication
  269. except OpenSSL.SSL.Error as e:
  270. raise ssl.SSLError("read error: %r" % e)
  271. def settimeout(self, timeout):
  272. return self.socket.settimeout(timeout)
  273. def _send_until_done(self, data):
  274. while True:
  275. try:
  276. return self.connection.send(data)
  277. except OpenSSL.SSL.WantWriteError:
  278. if not util.wait_for_write(self.socket, self.socket.gettimeout()):
  279. raise timeout()
  280. continue
  281. except OpenSSL.SSL.SysCallError as e:
  282. raise SocketError(str(e))
  283. def sendall(self, data):
  284. total_sent = 0
  285. while total_sent < len(data):
  286. sent = self._send_until_done(
  287. data[total_sent : total_sent + SSL_WRITE_BLOCKSIZE]
  288. )
  289. total_sent += sent
  290. def shutdown(self):
  291. # FIXME rethrow compatible exceptions should we ever use this
  292. self.connection.shutdown()
  293. def close(self):
  294. if self._makefile_refs < 1:
  295. try:
  296. self._closed = True
  297. return self.connection.close()
  298. except OpenSSL.SSL.Error:
  299. return
  300. else:
  301. self._makefile_refs -= 1
  302. def getpeercert(self, binary_form=False):
  303. x509 = self.connection.get_peer_certificate()
  304. if not x509:
  305. return x509
  306. if binary_form:
  307. return OpenSSL.crypto.dump_certificate(OpenSSL.crypto.FILETYPE_ASN1, x509)
  308. return {
  309. "subject": ((("commonName", x509.get_subject().CN),),),
  310. "subjectAltName": get_subj_alt_name(x509),
  311. }
  312. def version(self):
  313. return self.connection.get_protocol_version_name()
  314. def _reuse(self):
  315. self._makefile_refs += 1
  316. def _drop(self):
  317. if self._makefile_refs < 1:
  318. self.close()
  319. else:
  320. self._makefile_refs -= 1
  321. if _fileobject: # Platform-specific: Python 2
  322. def makefile(self, mode, bufsize=-1):
  323. self._makefile_refs += 1
  324. return _fileobject(self, mode, bufsize, close=True)
  325. else: # Platform-specific: Python 3
  326. makefile = backport_makefile
  327. WrappedSocket.makefile = makefile
  328. class PyOpenSSLContext(object):
  329. """
  330. I am a wrapper class for the PyOpenSSL ``Context`` object. I am responsible
  331. for translating the interface of the standard library ``SSLContext`` object
  332. to calls into PyOpenSSL.
  333. """
  334. def __init__(self, protocol):
  335. self.protocol = _openssl_versions[protocol]
  336. self._ctx = OpenSSL.SSL.Context(self.protocol)
  337. self._options = 0
  338. self.check_hostname = False
  339. @property
  340. def options(self):
  341. return self._options
  342. @options.setter
  343. def options(self, value):
  344. self._options = value
  345. self._ctx.set_options(value)
  346. @property
  347. def verify_mode(self):
  348. return _openssl_to_stdlib_verify[self._ctx.get_verify_mode()]
  349. @verify_mode.setter
  350. def verify_mode(self, value):
  351. self._ctx.set_verify(_stdlib_to_openssl_verify[value], _verify_callback)
  352. def set_default_verify_paths(self):
  353. self._ctx.set_default_verify_paths()
  354. def set_ciphers(self, ciphers):
  355. if isinstance(ciphers, six.text_type):
  356. ciphers = ciphers.encode("utf-8")
  357. self._ctx.set_cipher_list(ciphers)
  358. def load_verify_locations(self, cafile=None, capath=None, cadata=None):
  359. if cafile is not None:
  360. cafile = cafile.encode("utf-8")
  361. if capath is not None:
  362. capath = capath.encode("utf-8")
  363. try:
  364. self._ctx.load_verify_locations(cafile, capath)
  365. if cadata is not None:
  366. self._ctx.load_verify_locations(BytesIO(cadata))
  367. except OpenSSL.SSL.Error as e:
  368. raise ssl.SSLError("unable to load trusted certificates: %r" % e)
  369. def load_cert_chain(self, certfile, keyfile=None, password=None):
  370. self._ctx.use_certificate_chain_file(certfile)
  371. if password is not None:
  372. if not isinstance(password, six.binary_type):
  373. password = password.encode("utf-8")
  374. self._ctx.set_passwd_cb(lambda *_: password)
  375. self._ctx.use_privatekey_file(keyfile or certfile)
  376. def set_alpn_protocols(self, protocols):
  377. protocols = [six.ensure_binary(p) for p in protocols]
  378. return self._ctx.set_alpn_protos(protocols)
  379. def wrap_socket(
  380. self,
  381. sock,
  382. server_side=False,
  383. do_handshake_on_connect=True,
  384. suppress_ragged_eofs=True,
  385. server_hostname=None,
  386. ):
  387. cnx = OpenSSL.SSL.Connection(self._ctx, sock)
  388. if isinstance(server_hostname, six.text_type): # Platform-specific: Python 3
  389. server_hostname = server_hostname.encode("utf-8")
  390. if server_hostname is not None:
  391. cnx.set_tlsext_host_name(server_hostname)
  392. cnx.set_connect_state()
  393. while True:
  394. try:
  395. cnx.do_handshake()
  396. except OpenSSL.SSL.WantReadError:
  397. if not util.wait_for_read(sock, sock.gettimeout()):
  398. raise timeout("select timed out")
  399. continue
  400. except OpenSSL.SSL.Error as e:
  401. raise ssl.SSLError("bad handshake: %r" % e)
  402. break
  403. return WrappedSocket(cnx, sock)
  404. def _verify_callback(cnx, x509, err_no, err_depth, return_code):
  405. return err_no == 0