Blame SOURCES/00146-hashlib-fips.patch

98d66e
From ece76465680b0df5b3fce7bf8ff1ff0253933889 Mon Sep 17 00:00:00 2001
98d66e
From: Petr Viktorin <pviktori@redhat.com>
98d66e
Date: Mon, 2 Sep 2019 17:33:29 +0200
98d66e
Subject: [PATCH 01/11] Remove HASH_OBJ_CONSTRUCTOR
98d66e
98d66e
See https://github.com/python/cpython/commit/c7e219132aff1e21cb9ccb0a9b570dc6c750039b
98d66e
---
98d66e
 Modules/_hashopenssl.c | 59 ------------------------------------------
98d66e
 1 file changed, 59 deletions(-)
98d66e
98d66e
diff --git a/Modules/_hashopenssl.c b/Modules/_hashopenssl.c
98d66e
index 78445ebabdd3..cb81e9765251 100644
98d66e
--- a/Modules/_hashopenssl.c
98d66e
+++ b/Modules/_hashopenssl.c
98d66e
@@ -48,10 +48,6 @@
98d66e
  * to allow the user to optimize based on the platform they're using. */
98d66e
 #define HASHLIB_GIL_MINSIZE 2048
98d66e
 
98d66e
-#ifndef HASH_OBJ_CONSTRUCTOR
98d66e
-#define HASH_OBJ_CONSTRUCTOR 0
98d66e
-#endif
98d66e
-
98d66e
 #if defined(OPENSSL_VERSION_NUMBER) && (OPENSSL_VERSION_NUMBER >= 0x00908000)
98d66e
 #define _OPENSSL_SUPPORTS_SHA2
98d66e
 #endif
98d66e
@@ -384,53 +380,6 @@ EVP_repr(PyObject *self)
98d66e
     return PyString_FromString(buf);
98d66e
 }
98d66e
 
98d66e
-#if HASH_OBJ_CONSTRUCTOR
98d66e
-static int
98d66e
-EVP_tp_init(EVPobject *self, PyObject *args, PyObject *kwds)
98d66e
-{
98d66e
-    static char *kwlist[] = {"name", "string", NULL};
98d66e
-    PyObject *name_obj = NULL;
98d66e
-    Py_buffer view = { 0 };
98d66e
-    char *nameStr;
98d66e
-    const EVP_MD *digest;
98d66e
-
98d66e
-    if (!PyArg_ParseTupleAndKeywords(args, kwds, "O|s*:HASH", kwlist,
98d66e
-                                     &name_obj, &view)) {
98d66e
-        return -1;
98d66e
-    }
98d66e
-
98d66e
-    if (!PyArg_Parse(name_obj, "s", &nameStr)) {
98d66e
-        PyErr_SetString(PyExc_TypeError, "name must be a string");
98d66e
-        PyBuffer_Release(&view);
98d66e
-        return -1;
98d66e
-    }
98d66e
-
98d66e
-    digest = EVP_get_digestbyname(nameStr);
98d66e
-    if (!digest) {
98d66e
-        PyErr_SetString(PyExc_ValueError, "unknown hash function");
98d66e
-        PyBuffer_Release(&view);
98d66e
-        return -1;
98d66e
-    }
98d66e
-    EVP_DigestInit(self->ctx, digest);
98d66e
-
98d66e
-    self->name = name_obj;
98d66e
-    Py_INCREF(self->name);
98d66e
-
98d66e
-    if (view.obj) {
98d66e
-        if (view.len >= HASHLIB_GIL_MINSIZE) {
98d66e
-            Py_BEGIN_ALLOW_THREADS
98d66e
-            EVP_hash(self, view.buf, view.len);
98d66e
-            Py_END_ALLOW_THREADS
98d66e
-        } else {
98d66e
-            EVP_hash(self, view.buf, view.len);
98d66e
-        }
98d66e
-        PyBuffer_Release(&view);
98d66e
-    }
98d66e
-
98d66e
-    return 0;
98d66e
-}
98d66e
-#endif
98d66e
-
98d66e
 
98d66e
 PyDoc_STRVAR(hashtype_doc,
98d66e
 "A hash represents the object used to calculate a checksum of a\n\
98d66e
@@ -487,9 +436,6 @@ static PyTypeObject EVPtype = {
98d66e
     0,                  /* tp_descr_set */
98d66e
     0,                  /* tp_dictoffset */
98d66e
 #endif
98d66e
-#if HASH_OBJ_CONSTRUCTOR
98d66e
-    (initproc)EVP_tp_init, /* tp_init */
98d66e
-#endif
98d66e
 };
98d66e
 
98d66e
 static PyObject *
98d66e
@@ -928,11 +874,6 @@ init_hashlib(void)
98d66e
         return;
98d66e
     }
98d66e
 
98d66e
-#if HASH_OBJ_CONSTRUCTOR
98d66e
-    Py_INCREF(&EVPtype);
98d66e
-    PyModule_AddObject(m, "HASH", (PyObject *)&EVPtype);
98d66e
-#endif
98d66e
-
98d66e
     /* these constants are used by the convenience constructors */
98d66e
     INIT_CONSTRUCTOR_CONSTANTS(md5);
98d66e
     INIT_CONSTRUCTOR_CONSTANTS(sha1);
98d66e
98d66e
From d7339af75678c760f6d6c0eb455b0eb889c22574 Mon Sep 17 00:00:00 2001
98d66e
From: Petr Viktorin <pviktori@redhat.com>
98d66e
Date: Mon, 2 Sep 2019 18:02:25 +0200
98d66e
Subject: [PATCH 02/11] Add the usedforsecurity argument to _hashopenssl
98d66e
98d66e
---
98d66e
 Modules/_hashopenssl.c | 63 ++++++++++++++++++++++++++++++++----------
98d66e
 1 file changed, 48 insertions(+), 15 deletions(-)
98d66e
98d66e
diff --git a/Modules/_hashopenssl.c b/Modules/_hashopenssl.c
98d66e
index cb81e9765251..f2dbc095cc66 100644
98d66e
--- a/Modules/_hashopenssl.c
98d66e
+++ b/Modules/_hashopenssl.c
98d66e
@@ -441,7 +441,7 @@ static PyTypeObject EVPtype = {
98d66e
 static PyObject *
98d66e
 EVPnew(PyObject *name_obj,
98d66e
        const EVP_MD *digest, const EVP_MD_CTX *initial_ctx,
98d66e
-       const unsigned char *cp, Py_ssize_t len)
98d66e
+       const unsigned char *cp, Py_ssize_t len, int usedforsecurity)
98d66e
 {
98d66e
     EVPobject *self;
98d66e
 
98d66e
@@ -456,7 +456,23 @@ EVPnew(PyObject *name_obj,
98d66e
     if (initial_ctx) {
98d66e
         EVP_MD_CTX_copy(self->ctx, initial_ctx);
98d66e
     } else {
98d66e
-        EVP_DigestInit(self->ctx, digest);
98d66e
+        EVP_MD_CTX_init(self->ctx);
98d66e
+
98d66e
+        /*
98d66e
+        If the user has declared that this digest is being used in a
98d66e
+        non-security role (e.g. indexing into a data structure), set
98d66e
+        the exception flag for openssl to allow it
98d66e
+        */
98d66e
+        if (!usedforsecurity) {
98d66e
+#ifdef EVP_MD_CTX_FLAG_NON_FIPS_ALLOW
98d66e
+            EVP_MD_CTX_set_flags(self->ctx, EVP_MD_CTX_FLAG_NON_FIPS_ALLOW);
98d66e
+#endif
98d66e
+        }
98d66e
+        if (!EVP_DigestInit_ex(self->ctx, digest, NULL)) {
98d66e
+            _setException(PyExc_ValueError);
98d66e
+            Py_DECREF(self);
98d66e
+            return NULL;
98d66e
+        }
98d66e
     }
98d66e
 
98d66e
     if (cp && len) {
98d66e
@@ -485,15 +501,16 @@ The MD5 and SHA1 algorithms are always supported.\n");
98d66e
 static PyObject *
98d66e
 EVP_new(PyObject *self, PyObject *args, PyObject *kwdict)
98d66e
 {
98d66e
-    static char *kwlist[] = {"name", "string", NULL};
98d66e
+    static char *kwlist[] = {"name", "string", "usedforsecurity", NULL};
98d66e
     PyObject *name_obj = NULL;
98d66e
     Py_buffer view = { 0 };
98d66e
     PyObject *ret_obj;
98d66e
     char *name;
98d66e
     const EVP_MD *digest;
98d66e
+    int usedforsecurity = 1;
98d66e
 
98d66e
-    if (!PyArg_ParseTupleAndKeywords(args, kwdict, "O|s*:new", kwlist,
98d66e
-                                     &name_obj, &view)) {
98d66e
+    if (!PyArg_ParseTupleAndKeywords(args, kwdict, "O|s*i:new", kwlist,
98d66e
+                                     &name_obj, &view, &usedforsecurity)) {
98d66e
         return NULL;
98d66e
     }
98d66e
 
98d66e
@@ -506,7 +523,7 @@ EVP_new(PyObject *self, PyObject *args, PyObject *kwdict)
98d66e
     digest = EVP_get_digestbyname(name);
98d66e
 
98d66e
     ret_obj = EVPnew(name_obj, digest, NULL, (unsigned char*)view.buf,
98d66e
-                     view.len);
98d66e
+                     view.len, usedforsecurity);
98d66e
     PyBuffer_Release(&view);
98d66e
 
98d66e
     return ret_obj;
98d66e
@@ -771,30 +788,46 @@ generate_hash_name_list(void)
98d66e
  *  the generic one passing it a python string and are noticeably
98d66e
  *  faster than calling a python new() wrapper.  Thats important for
98d66e
  *  code that wants to make hashes of a bunch of small strings.
98d66e
+ *
98d66e
+ *  For usedforsecurity=False, the optimization is not used.
98d66e
  */
98d66e
 #define GEN_CONSTRUCTOR(NAME)  \
98d66e
     static PyObject * \
98d66e
-    EVP_new_ ## NAME (PyObject *self, PyObject *args) \
98d66e
+    EVP_new_ ## NAME (PyObject *self, PyObject *args, PyObject *kwdict) \
98d66e
     { \
98d66e
+        static char *kwlist[] = {"string", "usedforsecurity", NULL}; \
98d66e
         Py_buffer view = { 0 }; \
98d66e
         PyObject *ret_obj; \
98d66e
+        int usedforsecurity=1; \
98d66e
      \
98d66e
-        if (!PyArg_ParseTuple(args, "|s*:" #NAME , &view)) { \
98d66e
+        if (!PyArg_ParseTupleAndKeywords( \
98d66e
+            args, kwdict, "|s*i:" #NAME, kwlist, \
98d66e
+            &view, &usedforsecurity \
98d66e
+        )) { \
98d66e
             return NULL; \
98d66e
         } \
98d66e
-     \
98d66e
-        ret_obj = EVPnew( \
98d66e
-                    CONST_ ## NAME ## _name_obj, \
98d66e
-                    NULL, \
98d66e
-                    CONST_new_ ## NAME ## _ctx_p, \
98d66e
-                    (unsigned char*)view.buf, view.len); \
98d66e
+        if (usedforsecurity == 0) { \
98d66e
+            ret_obj = EVPnew( \
98d66e
+                        CONST_ ## NAME ## _name_obj, \
98d66e
+                        EVP_get_digestbyname(#NAME), \
98d66e
+                        NULL, \
98d66e
+                        (unsigned char*)view.buf, view.len, \
98d66e
+                        usedforsecurity); \
98d66e
+        } else { \
98d66e
+            ret_obj = EVPnew( \
98d66e
+                        CONST_ ## NAME ## _name_obj, \
98d66e
+                        NULL, \
98d66e
+                        CONST_new_ ## NAME ## _ctx_p, \
98d66e
+                        (unsigned char*)view.buf, view.len, \
98d66e
+                        usedforsecurity); \
98d66e
+        } \
98d66e
         PyBuffer_Release(&view); \
98d66e
         return ret_obj; \
98d66e
     }
98d66e
 
98d66e
 /* a PyMethodDef structure for the constructor */
98d66e
 #define CONSTRUCTOR_METH_DEF(NAME)  \
98d66e
-    {"openssl_" #NAME, (PyCFunction)EVP_new_ ## NAME, METH_VARARGS, \
98d66e
+    {"openssl_" #NAME, (PyCFunction)EVP_new_ ## NAME, METH_VARARGS|METH_KEYWORDS, \
98d66e
         PyDoc_STR("Returns a " #NAME \
98d66e
                   " hash object; optionally initialized with a string") \
98d66e
     }
98d66e
98d66e
From c8102e61fb3ade364d4bb7f2fe3f3452e2018ecd Mon Sep 17 00:00:00 2001
98d66e
From: David Malcolm <dmalcolm@redhat.com>
98d66e
Date: Mon, 2 Sep 2019 17:59:53 +0200
98d66e
Subject: [PATCH 03/11] hashlib.py: Avoid the builtin constructor
98d66e
98d66e
---
98d66e
 Lib/hashlib.py | 58 +++++++++++++-------------------------------------
98d66e
 1 file changed, 15 insertions(+), 43 deletions(-)
98d66e
98d66e
diff --git a/Lib/hashlib.py b/Lib/hashlib.py
98d66e
index bbd06b9996ee..404ed6891fb9 100644
98d66e
--- a/Lib/hashlib.py
98d66e
+++ b/Lib/hashlib.py
98d66e
@@ -69,65 +69,37 @@
98d66e
                                 'pbkdf2_hmac')
98d66e
 
98d66e
 
98d66e
-def __get_builtin_constructor(name):
98d66e
-    try:
98d66e
-        if name in ('SHA1', 'sha1'):
98d66e
-            import _sha
98d66e
-            return _sha.new
98d66e
-        elif name in ('MD5', 'md5'):
98d66e
-            import _md5
98d66e
-            return _md5.new
98d66e
-        elif name in ('SHA256', 'sha256', 'SHA224', 'sha224'):
98d66e
-            import _sha256
98d66e
-            bs = name[3:]
98d66e
-            if bs == '256':
98d66e
-                return _sha256.sha256
98d66e
-            elif bs == '224':
98d66e
-                return _sha256.sha224
98d66e
-        elif name in ('SHA512', 'sha512', 'SHA384', 'sha384'):
98d66e
-            import _sha512
98d66e
-            bs = name[3:]
98d66e
-            if bs == '512':
98d66e
-                return _sha512.sha512
98d66e
-            elif bs == '384':
98d66e
-                return _sha512.sha384
98d66e
-    except ImportError:
98d66e
-        pass  # no extension module, this hash is unsupported.
98d66e
-
98d66e
-    raise ValueError('unsupported hash type ' + name)
98d66e
-
98d66e
-
98d66e
 def __get_openssl_constructor(name):
98d66e
     try:
98d66e
         f = getattr(_hashlib, 'openssl_' + name)
98d66e
         # Allow the C module to raise ValueError.  The function will be
98d66e
         # defined but the hash not actually available thanks to OpenSSL.
98d66e
-        f()
98d66e
+        #
98d66e
+        # We pass "usedforsecurity=False" to disable FIPS-based restrictions:
98d66e
+        # at this stage we're merely seeing if the function is callable,
98d66e
+        # rather than using it for actual work.
98d66e
+        f(usedforsecurity=False)
98d66e
         # Use the C function directly (very fast)
98d66e
         return f
98d66e
     except (AttributeError, ValueError):
98d66e
-        return __get_builtin_constructor(name)
98d66e
-
98d66e
-
98d66e
-def __py_new(name, string=''):
98d66e
-    """new(name, string='') - Return a new hashing object using the named algorithm;
98d66e
-    optionally initialized with a string.
98d66e
-    """
98d66e
-    return __get_builtin_constructor(name)(string)
98d66e
+        raise
98d66e
 
98d66e
 
98d66e
-def __hash_new(name, string=''):
98d66e
-    """new(name, string='') - Return a new hashing object using the named algorithm;
98d66e
-    optionally initialized with a string.
98d66e
+def __hash_new(name, string='', usedforsecurity=True):
98d66e
+    """new(name, string='', usedforsecurity=True) - Return a new hashing object
98d66e
+    using the named algorithm; optionally initialized with a string.
98d66e
+    
98d66e
+    Override 'usedforsecurity' to False when using for non-security purposes in
98d66e
+    a FIPS environment
98d66e
     """
98d66e
     try:
98d66e
-        return _hashlib.new(name, string)
98d66e
+        return _hashlib.new(name, string, usedforsecurity)
98d66e
     except ValueError:
98d66e
         # If the _hashlib module (OpenSSL) doesn't support the named
98d66e
         # hash, try using our builtin implementations.
98d66e
         # This allows for SHA224/256 and SHA384/512 support even though
98d66e
         # the OpenSSL library prior to 0.9.8 doesn't provide them.
98d66e
-        return __get_builtin_constructor(name)(string)
98d66e
+        raise
98d66e
 
98d66e
 
98d66e
 try:
98d66e
@@ -218,4 +190,4 @@ def prf(msg, inner=inner, outer=outer):
98d66e
 
98d66e
 # Cleanup locals()
98d66e
 del __always_supported, __func_name, __get_hash
98d66e
-del __py_new, __hash_new, __get_openssl_constructor
98d66e
+del __hash_new, __get_openssl_constructor
98d66e
98d66e
From 2ade3e5a6c5732c0692c4cc2235a2bbe0948f50b Mon Sep 17 00:00:00 2001
98d66e
From: David Malcolm <dmalcolm@redhat.com>
98d66e
Date: Mon, 2 Sep 2019 17:56:46 +0200
98d66e
Subject: [PATCH 04/11] Adjust docstrings & comments
98d66e
98d66e
---
98d66e
 Lib/hashlib.py         | 29 ++++++++++++++++++++++-------
98d66e
 Modules/_hashopenssl.c |  9 ++++++++-
98d66e
 2 files changed, 30 insertions(+), 8 deletions(-)
98d66e
98d66e
diff --git a/Lib/hashlib.py b/Lib/hashlib.py
98d66e
index 404ed6891fb9..46d0b470ab4a 100644
98d66e
--- a/Lib/hashlib.py
98d66e
+++ b/Lib/hashlib.py
98d66e
@@ -6,9 +6,12 @@
98d66e
 
98d66e
 __doc__ = """hashlib module - A common interface to many hash functions.
98d66e
 
98d66e
-new(name, string='') - returns a new hash object implementing the
98d66e
-                       given hash function; initializing the hash
98d66e
-                       using the given string data.
98d66e
+new(name, string='', usedforsecurity=True)
98d66e
+     - returns a new hash object implementing the given hash function;
98d66e
+       initializing the hash using the given string data.
98d66e
+
98d66e
+       "usedforsecurity" is a non-standard extension for better supporting
98d66e
+       FIPS-compliant environments (see below)
98d66e
 
98d66e
 Named constructor functions are also available, these are much faster
98d66e
 than using new():
98d66e
@@ -25,6 +28,20 @@
98d66e
 Choose your hash function wisely.  Some have known collision weaknesses.
98d66e
 sha384 and sha512 will be slow on 32 bit platforms.
98d66e
 
98d66e
+Our implementation of hashlib uses OpenSSL.
98d66e
+
98d66e
+OpenSSL has a "FIPS mode", which, if enabled, may restrict the available hashes
98d66e
+to only those that are compliant with FIPS regulations.  For example, it may
98d66e
+deny the use of MD5, on the grounds that this is not secure for uses such as
98d66e
+authentication, system integrity checking, or digital signatures.
98d66e
+
98d66e
+If you need to use such a hash for non-security purposes (such as indexing into
98d66e
+a data structure for speed), you can override the keyword argument
98d66e
+"usedforsecurity" from True to False to signify that your code is not relying
98d66e
+on the hash for security purposes, and this will allow the hash to be usable
98d66e
+even in FIPS mode.  This is not a standard feature of Python 2.7's hashlib, and
98d66e
+is included here to better support FIPS mode.
98d66e
+
98d66e
 Hash objects have these methods:
98d66e
  - update(arg): Update the hash object with the string arg. Repeated calls
98d66e
                 are equivalent to a single call with the concatenation of all
98d66e
@@ -82,6 +99,7 @@ def __get_openssl_constructor(name):
98d66e
         # Use the C function directly (very fast)
98d66e
         return f
98d66e
     except (AttributeError, ValueError):
98d66e
+        # RHEL only: Fallbacks removed; we always use OpenSSL for hashes.
98d66e
         raise
98d66e
 
98d66e
 
98d66e
@@ -95,10 +113,7 @@ def __hash_new(name, string='', usedforsecurity=True):
98d66e
     try:
98d66e
         return _hashlib.new(name, string, usedforsecurity)
98d66e
     except ValueError:
98d66e
-        # If the _hashlib module (OpenSSL) doesn't support the named
98d66e
-        # hash, try using our builtin implementations.
98d66e
-        # This allows for SHA224/256 and SHA384/512 support even though
98d66e
-        # the OpenSSL library prior to 0.9.8 doesn't provide them.
98d66e
+        # RHEL only: Fallbacks removed; we always use OpenSSL for hashes.
98d66e
         raise
98d66e
 
98d66e
 
98d66e
diff --git a/Modules/_hashopenssl.c b/Modules/_hashopenssl.c
98d66e
index f2dbc095cc66..d24432e048bf 100644
98d66e
--- a/Modules/_hashopenssl.c
98d66e
+++ b/Modules/_hashopenssl.c
98d66e
@@ -496,7 +496,14 @@ PyDoc_STRVAR(EVP_new__doc__,
98d66e
 An optional string argument may be provided and will be\n\
98d66e
 automatically hashed.\n\
98d66e
 \n\
98d66e
-The MD5 and SHA1 algorithms are always supported.\n");
98d66e
+The MD5 and SHA1 algorithms are always supported.\n \
98d66e
+\n\
98d66e
+An optional \"usedforsecurity=True\" keyword argument is provided for use in\n\
98d66e
+environments that enforce FIPS-based restrictions.  Some implementations of\n\
98d66e
+OpenSSL can be configured to prevent the usage of non-secure algorithms (such\n\
98d66e
+as MD5).  If you have a non-security use for these algorithms (e.g. a hash\n\
98d66e
+table), you can override this argument by marking the callsite as\n\
98d66e
+\"usedforsecurity=False\".");
98d66e
 
98d66e
 static PyObject *
98d66e
 EVP_new(PyObject *self, PyObject *args, PyObject *kwdict)
98d66e
98d66e
From 6698e1d84c3f19bbb4438b2b2c78a5ef8bd5ad42 Mon Sep 17 00:00:00 2001
98d66e
From: Petr Viktorin <pviktori@redhat.com>
98d66e
Date: Thu, 29 Aug 2019 10:25:28 +0200
98d66e
Subject: [PATCH 05/11] Expose OpenSSL FIPS_mode as _hashlib.get_fips_mode
98d66e
98d66e
---
98d66e
 Modules/_hashopenssl.c | 22 ++++++++++++++++++++++
98d66e
 1 file changed, 22 insertions(+)
98d66e
98d66e
diff --git a/Modules/_hashopenssl.c b/Modules/_hashopenssl.c
98d66e
index d24432e048bf..74f9ab9ec150 100644
98d66e
--- a/Modules/_hashopenssl.c
98d66e
+++ b/Modules/_hashopenssl.c
98d66e
@@ -860,10 +860,32 @@ GEN_CONSTRUCTOR(sha384)
98d66e
 GEN_CONSTRUCTOR(sha512)
98d66e
 #endif
98d66e
 
98d66e
+static PyObject *
98d66e
+_hashlib_get_fips_mode(PyObject *module, PyObject *unused)
98d66e
+{
98d66e
+    // XXX: This function skips error checking.
98d66e
+    // This is only appropriate for RHEL.
98d66e
+
98d66e
+    // From the OpenSSL docs:
98d66e
+    // "If the library was built without support of the FIPS Object Module,
98d66e
+    // then the function will return 0 with an error code of
98d66e
+    // CRYPTO_R_FIPS_MODE_NOT_SUPPORTED (0x0f06d065)."
98d66e
+    // In RHEL:
98d66e
+    // * we do build with FIPS, so the function always succeeds
98d66e
+    // * even if it didn't, people seem used to errors being left on the
98d66e
+    //   OpenSSL error stack.
98d66e
+
98d66e
+    // For more info, see:
98d66e
+    //  https://bugzilla.redhat.com/show_bug.cgi?id=1745499
98d66e
+
98d66e
+    return PyInt_FromLong(FIPS_mode());
98d66e
+}
98d66e
+
98d66e
 /* List of functions exported by this module */
98d66e
 
98d66e
 static struct PyMethodDef EVP_functions[] = {
98d66e
     {"new", (PyCFunction)EVP_new, METH_VARARGS|METH_KEYWORDS, EVP_new__doc__},
98d66e
+    {"get_fips_mode", (PyCFunction)_hashlib_get_fips_mode, METH_NOARGS, NULL},
98d66e
     CONSTRUCTOR_METH_DEF(md5),
98d66e
     CONSTRUCTOR_METH_DEF(sha1),
98d66e
 #ifdef _OPENSSL_SUPPORTS_SHA2
98d66e
98d66e
From 9a8833619658c6be5ca72c60189a64da05536d85 Mon Sep 17 00:00:00 2001
98d66e
From: David Malcolm <dmalcolm@redhat.com>
98d66e
Date: Mon, 2 Sep 2019 18:00:26 +0200
98d66e
Subject: [PATCH 06/11] Adjust tests
98d66e
98d66e
---
98d66e
 Lib/test/test_hashlib.py | 118 ++++++++++++++++++++++++---------------
98d66e
 1 file changed, 74 insertions(+), 44 deletions(-)
98d66e
98d66e
diff --git a/Lib/test/test_hashlib.py b/Lib/test/test_hashlib.py
98d66e
index b8d6388feaf9..b03fc84f82b4 100644
98d66e
--- a/Lib/test/test_hashlib.py
98d66e
+++ b/Lib/test/test_hashlib.py
98d66e
@@ -34,6 +34,8 @@ def hexstr(s):
98d66e
         r = r + h[(i >> 4) & 0xF] + h[i & 0xF]
98d66e
     return r
98d66e
 
98d66e
+from _hashlib import get_fips_mode
98d66e
+
98d66e
 
98d66e
 class HashLibTestCase(unittest.TestCase):
98d66e
     supported_hash_names = ( 'md5', 'MD5', 'sha1', 'SHA1',
98d66e
@@ -63,10 +65,10 @@ def __init__(self, *args, **kwargs):
98d66e
         # of hashlib.new given the algorithm name.
98d66e
         for algorithm, constructors in self.constructors_to_test.items():
98d66e
             constructors.add(getattr(hashlib, algorithm))
98d66e
-            def _test_algorithm_via_hashlib_new(data=None, _alg=algorithm):
98d66e
+            def _test_algorithm_via_hashlib_new(data=None, _alg=algorithm, usedforsecurity=True):
98d66e
                 if data is None:
98d66e
-                    return hashlib.new(_alg)
98d66e
-                return hashlib.new(_alg, data)
98d66e
+                    return hashlib.new(_alg, usedforsecurity=usedforsecurity)
98d66e
+                return hashlib.new(_alg, data, usedforsecurity=usedforsecurity)
98d66e
             constructors.add(_test_algorithm_via_hashlib_new)
98d66e
 
98d66e
         _hashlib = self._conditional_import_module('_hashlib')
98d66e
@@ -80,28 +82,13 @@ def _test_algorithm_via_hashlib_new(data=None, _alg=algorithm):
98d66e
                 if constructor:
98d66e
                     constructors.add(constructor)
98d66e
 
98d66e
-        _md5 = self._conditional_import_module('_md5')
98d66e
-        if _md5:
98d66e
-            self.constructors_to_test['md5'].add(_md5.new)
98d66e
-        _sha = self._conditional_import_module('_sha')
98d66e
-        if _sha:
98d66e
-            self.constructors_to_test['sha1'].add(_sha.new)
98d66e
-        _sha256 = self._conditional_import_module('_sha256')
98d66e
-        if _sha256:
98d66e
-            self.constructors_to_test['sha224'].add(_sha256.sha224)
98d66e
-            self.constructors_to_test['sha256'].add(_sha256.sha256)
98d66e
-        _sha512 = self._conditional_import_module('_sha512')
98d66e
-        if _sha512:
98d66e
-            self.constructors_to_test['sha384'].add(_sha512.sha384)
98d66e
-            self.constructors_to_test['sha512'].add(_sha512.sha512)
98d66e
-
98d66e
         super(HashLibTestCase, self).__init__(*args, **kwargs)
98d66e
 
98d66e
     def test_hash_array(self):
98d66e
         a = array.array("b", range(10))
98d66e
         constructors = self.constructors_to_test.itervalues()
98d66e
         for cons in itertools.chain.from_iterable(constructors):
98d66e
-            c = cons(a)
98d66e
+            c = cons(a, usedforsecurity=False)
98d66e
             c.hexdigest()
98d66e
 
98d66e
     def test_algorithms_attribute(self):
98d66e
@@ -122,28 +109,9 @@ def test_unknown_hash(self):
98d66e
         self.assertRaises(ValueError, hashlib.new, 'spam spam spam spam spam')
98d66e
         self.assertRaises(TypeError, hashlib.new, 1)
98d66e
 
98d66e
-    def test_get_builtin_constructor(self):
98d66e
-        get_builtin_constructor = hashlib.__dict__[
98d66e
-                '__get_builtin_constructor']
98d66e
-        self.assertRaises(ValueError, get_builtin_constructor, 'test')
98d66e
-        try:
98d66e
-            import _md5
98d66e
-        except ImportError:
98d66e
-            pass
98d66e
-        # This forces an ImportError for "import _md5" statements
98d66e
-        sys.modules['_md5'] = None
98d66e
-        try:
98d66e
-            self.assertRaises(ValueError, get_builtin_constructor, 'md5')
98d66e
-        finally:
98d66e
-            if '_md5' in locals():
98d66e
-                sys.modules['_md5'] = _md5
98d66e
-            else:
98d66e
-                del sys.modules['_md5']
98d66e
-        self.assertRaises(TypeError, get_builtin_constructor, 3)
98d66e
-
98d66e
     def test_hexdigest(self):
98d66e
         for name in self.supported_hash_names:
98d66e
-            h = hashlib.new(name)
98d66e
+            h = hashlib.new(name, usedforsecurity=False)
98d66e
             self.assertTrue(hexstr(h.digest()) == h.hexdigest())
98d66e
 
98d66e
     def test_large_update(self):
98d66e
@@ -153,16 +121,16 @@ def test_large_update(self):
98d66e
         abcs = aas + bees + cees
98d66e
 
98d66e
         for name in self.supported_hash_names:
98d66e
-            m1 = hashlib.new(name)
98d66e
+            m1 = hashlib.new(name, usedforsecurity=False)
98d66e
             m1.update(aas)
98d66e
             m1.update(bees)
98d66e
             m1.update(cees)
98d66e
 
98d66e
-            m2 = hashlib.new(name)
98d66e
+            m2 = hashlib.new(name, usedforsecurity=False)
98d66e
             m2.update(abcs)
98d66e
             self.assertEqual(m1.digest(), m2.digest(), name+' update problem.')
98d66e
 
98d66e
-            m3 = hashlib.new(name, abcs)
98d66e
+            m3 = hashlib.new(name, abcs, usedforsecurity=False)
98d66e
             self.assertEqual(m1.digest(), m3.digest(), name+' new problem.')
98d66e
 
98d66e
     def check(self, name, data, digest):
98d66e
@@ -170,7 +138,7 @@ def check(self, name, data, digest):
98d66e
         # 2 is for hashlib.name(...) and hashlib.new(name, ...)
98d66e
         self.assertGreaterEqual(len(constructors), 2)
98d66e
         for hash_object_constructor in constructors:
98d66e
-            computed = hash_object_constructor(data).hexdigest()
98d66e
+            computed = hash_object_constructor(data, usedforsecurity=False).hexdigest()
98d66e
             self.assertEqual(
98d66e
                     computed, digest,
98d66e
                     "Hash algorithm %s constructed using %s returned hexdigest"
98d66e
@@ -195,7 +163,7 @@ def check_update(self, name, data, digest):
98d66e
 
98d66e
     def check_unicode(self, algorithm_name):
98d66e
         # Unicode objects are not allowed as input.
98d66e
-        expected = hashlib.new(algorithm_name, str(u'spam')).hexdigest()
98d66e
+        expected = hashlib.new(algorithm_name, str(u'spam'), usedforsecurity=False).hexdigest()
98d66e
         self.check(algorithm_name, u'spam', expected)
98d66e
 
98d66e
     def test_unicode(self):
98d66e
@@ -393,6 +361,68 @@ def hash_in_chunks(chunk_size):
98d66e
 
98d66e
         self.assertEqual(expected_hash, hasher.hexdigest())
98d66e
 
98d66e
+    def test_issue9146(self):
98d66e
+        # Ensure that various ways to use "MD5" from "hashlib" don't segfault:
98d66e
+        m = hashlib.md5(usedforsecurity=False)
98d66e
+        m.update(b'abc\n')
98d66e
+        self.assertEquals(m.hexdigest(), "0bee89b07a248e27c83fc3d5951213c1")
98d66e
+
98d66e
+        m = hashlib.new('md5', usedforsecurity=False)
98d66e
+        m.update(b'abc\n')
98d66e
+        self.assertEquals(m.hexdigest(), "0bee89b07a248e27c83fc3d5951213c1")
98d66e
+
98d66e
+        m = hashlib.md5(b'abc\n', usedforsecurity=False)
98d66e
+        self.assertEquals(m.hexdigest(), "0bee89b07a248e27c83fc3d5951213c1")
98d66e
+
98d66e
+        m = hashlib.new('md5', b'abc\n', usedforsecurity=False)
98d66e
+        self.assertEquals(m.hexdigest(), "0bee89b07a248e27c83fc3d5951213c1")
98d66e
+
98d66e
+    def assertRaisesDisabledForFIPS(self, callable_obj=None, *args, **kwargs):
98d66e
+        try:
98d66e
+            callable_obj(*args, **kwargs)
98d66e
+        except ValueError, e:
98d66e
+            if not e.args[0].endswith('disabled for FIPS'):
98d66e
+                self.fail('Incorrect exception raised')
98d66e
+        else:
98d66e
+            self.fail('Exception was not raised')
98d66e
+
98d66e
+    @unittest.skipUnless(get_fips_mode(),
98d66e
+                         'FIPS enforcement required for this test.')
98d66e
+    def test_hashlib_fips_mode(self):
98d66e
+        # Ensure that we raise a ValueError on vanilla attempts to use MD5
98d66e
+        # in hashlib in a FIPS-enforced setting:
98d66e
+        self.assertRaisesDisabledForFIPS(hashlib.md5)
98d66e
+        self.assertRaisesDisabledForFIPS(hashlib.new, 'md5')
98d66e
+
98d66e
+    @unittest.skipUnless(get_fips_mode(),
98d66e
+                         'FIPS enforcement required for this test.')
98d66e
+    def test_hashopenssl_fips_mode(self):
98d66e
+        # Verify the _hashlib module's handling of md5:
98d66e
+        import _hashlib
98d66e
+
98d66e
+        assert hasattr(_hashlib, 'openssl_md5')
98d66e
+
98d66e
+        # Ensure that _hashlib raises a ValueError on vanilla attempts to
98d66e
+        # use MD5 in a FIPS-enforced setting:
98d66e
+        self.assertRaisesDisabledForFIPS(_hashlib.openssl_md5)
98d66e
+        self.assertRaisesDisabledForFIPS(_hashlib.new, 'md5')
98d66e
+
98d66e
+        # Ensure that in such a setting we can whitelist a callsite with
98d66e
+        # usedforsecurity=False and have it succeed:
98d66e
+        m = _hashlib.openssl_md5(usedforsecurity=False)
98d66e
+        m.update('abc\n')
98d66e
+        self.assertEquals(m.hexdigest(), "0bee89b07a248e27c83fc3d5951213c1")
98d66e
+
98d66e
+        m = _hashlib.new('md5', usedforsecurity=False)
98d66e
+        m.update('abc\n')
98d66e
+        self.assertEquals(m.hexdigest(), "0bee89b07a248e27c83fc3d5951213c1")
98d66e
+
98d66e
+        m = _hashlib.openssl_md5('abc\n', usedforsecurity=False)
98d66e
+        self.assertEquals(m.hexdigest(), "0bee89b07a248e27c83fc3d5951213c1")
98d66e
+
98d66e
+        m = _hashlib.new('md5', 'abc\n', usedforsecurity=False)
98d66e
+        self.assertEquals(m.hexdigest(), "0bee89b07a248e27c83fc3d5951213c1")
98d66e
+
98d66e
 
98d66e
 class KDFTests(unittest.TestCase):
98d66e
     pbkdf2_test_vectors = [
98d66e
98d66e
From 31e527aa4f57845dfb0c3dd4f0e9192af5a5b4e2 Mon Sep 17 00:00:00 2001
98d66e
From: David Malcolm <dmalcolm@redhat.com>
98d66e
Date: Mon, 2 Sep 2019 18:00:47 +0200
98d66e
Subject: [PATCH 07/11] Don't build non-OpenSSL hash implementations
98d66e
98d66e
---
98d66e
 setup.py | 15 ---------------
98d66e
 1 file changed, 15 deletions(-)
98d66e
98d66e
diff --git a/setup.py b/setup.py
98d66e
index 33cecc687573..272d2f1b5bb8 100644
98d66e
--- a/setup.py
98d66e
+++ b/setup.py
98d66e
@@ -874,21 +874,6 @@ def detect_modules(self):
98d66e
                 print ("warning: openssl 0x%08x is too old for _hashlib" %
98d66e
                        openssl_ver)
98d66e
                 missing.append('_hashlib')
98d66e
-        if COMPILED_WITH_PYDEBUG or not have_usable_openssl:
98d66e
-            # The _sha module implements the SHA1 hash algorithm.
98d66e
-            exts.append( Extension('_sha', ['shamodule.c']) )
98d66e
-            # The _md5 module implements the RSA Data Security, Inc. MD5
98d66e
-            # Message-Digest Algorithm, described in RFC 1321.  The
98d66e
-            # necessary files md5.c and md5.h are included here.
98d66e
-            exts.append( Extension('_md5',
98d66e
-                            sources = ['md5module.c', 'md5.c'],
98d66e
-                            depends = ['md5.h']) )
98d66e
-
98d66e
-        min_sha2_openssl_ver = 0x00908000
98d66e
-        if COMPILED_WITH_PYDEBUG or openssl_ver < min_sha2_openssl_ver:
98d66e
-            # OpenSSL doesn't do these until 0.9.8 so we'll bring our own hash
98d66e
-            exts.append( Extension('_sha256', ['sha256module.c']) )
98d66e
-            exts.append( Extension('_sha512', ['sha512module.c']) )
98d66e
 
98d66e
         # Modules that provide persistent dictionary-like semantics.  You will
98d66e
         # probably want to arrange for at least one of them to be available on
98d66e
98d66e
From e9cd6a63ce17a0120b1d017bf08f05f3ed223bb1 Mon Sep 17 00:00:00 2001
98d66e
From: Petr Viktorin <pviktori@redhat.com>
98d66e
Date: Mon, 2 Sep 2019 18:33:22 +0200
98d66e
Subject: [PATCH 08/11] Allow for errors in pre-created context creation
98d66e
98d66e
---
98d66e
 Modules/_hashopenssl.c | 6 ++++--
98d66e
 1 file changed, 4 insertions(+), 2 deletions(-)
98d66e
98d66e
diff --git a/Modules/_hashopenssl.c b/Modules/_hashopenssl.c
98d66e
index 74f9ab9ec150..7609e9e490f0 100644
98d66e
--- a/Modules/_hashopenssl.c
98d66e
+++ b/Modules/_hashopenssl.c
98d66e
@@ -813,7 +813,7 @@ generate_hash_name_list(void)
98d66e
         )) { \
98d66e
             return NULL; \
98d66e
         } \
98d66e
-        if (usedforsecurity == 0) { \
98d66e
+        if (usedforsecurity == 0 || CONST_new_ ## NAME ## _ctx_p == NULL) { \
98d66e
             ret_obj = EVPnew( \
98d66e
                         CONST_ ## NAME ## _name_obj, \
98d66e
                         EVP_get_digestbyname(#NAME), \
98d66e
@@ -846,7 +846,9 @@ generate_hash_name_list(void)
98d66e
     CONST_ ## NAME ## _name_obj = PyString_FromString(#NAME); \
98d66e
         if (EVP_get_digestbyname(#NAME)) { \
98d66e
             CONST_new_ ## NAME ## _ctx_p = EVP_MD_CTX_new(); \
98d66e
-            EVP_DigestInit(CONST_new_ ## NAME ## _ctx_p, EVP_get_digestbyname(#NAME)); \
98d66e
+            if (!EVP_DigestInit(CONST_new_ ## NAME ## _ctx_p, EVP_get_digestbyname(#NAME))) { \
98d66e
+                CONST_new_ ## NAME ## _ctx_p = NULL; \
98d66e
+            } \
98d66e
         } \
98d66e
     } \
98d66e
 } while (0);
98d66e
98d66e
From d0465ea1c07f24067b4d6f60f73a29c82f2ad03f Mon Sep 17 00:00:00 2001
98d66e
From: David Malcolm <dmalcolm@redhat.com>
98d66e
Date: Mon, 2 Sep 2019 18:40:08 +0200
98d66e
Subject: [PATCH 09/11] use SHA-256 rather than MD5 in
98d66e
 multiprocessing.connection (patch 169; rhbz#879695)
98d66e
98d66e
---
98d66e
 Lib/multiprocessing/connection.py | 12 ++++++++++--
98d66e
 1 file changed, 10 insertions(+), 2 deletions(-)
98d66e
98d66e
diff --git a/Lib/multiprocessing/connection.py b/Lib/multiprocessing/connection.py
98d66e
index 645a26f069ea..d4dc6ac19d53 100644
98d66e
--- a/Lib/multiprocessing/connection.py
98d66e
+++ b/Lib/multiprocessing/connection.py
98d66e
@@ -56,6 +56,10 @@
98d66e
 # A very generous timeout when it comes to local connections...
98d66e
 CONNECTION_TIMEOUT = 20.
98d66e
 
98d66e
+# The hmac module implicitly defaults to using MD5.
98d66e
+# Support using a stronger algorithm for the challenge/response code:
98d66e
+HMAC_DIGEST_NAME='sha256'
98d66e
+
98d66e
 _mmap_counter = itertools.count()
98d66e
 
98d66e
 default_family = 'AF_INET'
98d66e
@@ -413,12 +417,16 @@ def PipeClient(address):
98d66e
 WELCOME = b'#WELCOME#'
98d66e
 FAILURE = b'#FAILURE#'
98d66e
 
98d66e
+def get_digestmod_for_hmac():
98d66e
+    import hashlib
98d66e
+    return getattr(hashlib, HMAC_DIGEST_NAME)
98d66e
+
98d66e
 def deliver_challenge(connection, authkey):
98d66e
     import hmac
98d66e
     assert isinstance(authkey, bytes)
98d66e
     message = os.urandom(MESSAGE_LENGTH)
98d66e
     connection.send_bytes(CHALLENGE + message)
98d66e
-    digest = hmac.new(authkey, message).digest()
98d66e
+    digest = hmac.new(authkey, message, get_digestmod_for_hmac()).digest()
98d66e
     response = connection.recv_bytes(256)        # reject large message
98d66e
     if response == digest:
98d66e
         connection.send_bytes(WELCOME)
98d66e
@@ -432,7 +440,7 @@ def answer_challenge(connection, authkey):
98d66e
     message = connection.recv_bytes(256)         # reject large message
98d66e
     assert message[:len(CHALLENGE)] == CHALLENGE, 'message = %r' % message
98d66e
     message = message[len(CHALLENGE):]
98d66e
-    digest = hmac.new(authkey, message).digest()
98d66e
+    digest = hmac.new(authkey, message, get_digestmod_for_hmac()).digest()
98d66e
     connection.send_bytes(digest)
98d66e
     response = connection.recv_bytes(256)        # reject large message
98d66e
     if response != WELCOME:
98d66e
98d66e
From 82b181a2c55be0f0766fdf1f0a3e950d22fe0602 Mon Sep 17 00:00:00 2001
98d66e
From: Petr Viktorin <pviktori@redhat.com>
98d66e
Date: Mon, 19 Aug 2019 13:59:40 +0200
98d66e
Subject: [PATCH 10/11] Make uuid.uuid3 work (using libuuid via ctypes)
98d66e
98d66e
---
98d66e
 Lib/uuid.py | 8 ++++++++
98d66e
 1 file changed, 8 insertions(+)
98d66e
98d66e
diff --git a/Lib/uuid.py b/Lib/uuid.py
98d66e
index 80d33c0bd83f..bfb7477b5f58 100644
98d66e
--- a/Lib/uuid.py
98d66e
+++ b/Lib/uuid.py
98d66e
@@ -455,6 +455,7 @@ def _netbios_getnode():
98d66e
 
98d66e
 # If ctypes is available, use it to find system routines for UUID generation.
98d66e
 _uuid_generate_time = _UuidCreate = None
98d66e
+_uuid_generate_md5 = None
98d66e
 try:
98d66e
     import ctypes, ctypes.util
98d66e
     import sys
98d66e
@@ -471,6 +472,8 @@ def _netbios_getnode():
98d66e
             continue
98d66e
         if hasattr(lib, 'uuid_generate_time'):
98d66e
             _uuid_generate_time = lib.uuid_generate_time
98d66e
+            # The library that has uuid_generate_time should have uuid_generate_md5 too.
98d66e
+            _uuid_generate_md5 = getattr(lib, 'uuid_generate_md5')
98d66e
             break
98d66e
     del _libnames
98d66e
 
98d66e
@@ -595,6 +598,11 @@ def uuid1(node=None, clock_seq=None):
98d66e
 
98d66e
 def uuid3(namespace, name):
98d66e
     """Generate a UUID from the MD5 hash of a namespace UUID and a name."""
98d66e
+    if _uuid_generate_md5:
98d66e
+        _buffer = ctypes.create_string_buffer(16)
98d66e
+        _uuid_generate_md5(_buffer, namespace.bytes, name, len(name))
98d66e
+        return UUID(bytes=_buffer.raw)
98d66e
+
98d66e
     from hashlib import md5
98d66e
     hash = md5(namespace.bytes + name).digest()
98d66e
     return UUID(bytes=hash[:16], version=3)
98d66e