From 7ad40db8ba1a0c0fb5e6b3488561a65909c0b014 Mon Sep 17 00:00:00 2001
From: GYT <tiborgyri@gmail.com>
Date: Sun, 19 Jan 2025 12:31:27 +0100
Subject: [PATCH 1/2] add NaN propagation and array initialization notes to
 gemm docs

---
 BLAS/SRC/cgemm.f | 38 +++++++++++++++++++++++++++++++-------
 BLAS/SRC/dgemm.f | 44 +++++++++++++++++++++++++++++++++++++-------
 BLAS/SRC/sgemm.f | 44 +++++++++++++++++++++++++++++++++++++-------
 BLAS/SRC/zgemm.f | 38 +++++++++++++++++++++++++++++++-------
 4 files changed, 136 insertions(+), 28 deletions(-)

diff --git a/BLAS/SRC/cgemm.f b/BLAS/SRC/cgemm.f
index 6f1846c748..103466fadb 100644
--- a/BLAS/SRC/cgemm.f
+++ b/BLAS/SRC/cgemm.f
@@ -35,6 +35,19 @@
 *>
 *> alpha and beta are scalars, and A, B and C are matrices, with op( A )
 *> an m by k matrix,  op( B )  a  k by n matrix and  C an m by n matrix.
+*>
+*> Note: if alpha and/or beta is zero, some parts of the matrix-matrix
+*>  operations are not performed. This results in the following NaN/Inf
+*>  propagation quirks:
+*>
+*>  1. If alpha is zero and beta is one, NaNs or Infs in A or B do not affect
+*>   the result.
+*>  2. If both alpha and beta are zero, then a zero matrix is returned in C,
+*>   irrespective of any NaNs or Infs in A, B or C.
+*>  3. If alpha is zero and beta is neither zero or one, then beta*C is
+*>   returned in C, irrespective of any NaNs or Infs in A or B.
+*>  4. If only beta is zero, alpha*op( A )*op( B ) is returned, irrespective
+*>   of any NaNs or Infs in C.
 *> \endverbatim
 *
 *  Arguments:
@@ -92,7 +105,9 @@
 *> \param[in] ALPHA
 *> \verbatim
 *>          ALPHA is COMPLEX
-*>           On entry, ALPHA specifies the scalar alpha.
+*>           On entry, ALPHA specifies the scalar alpha. If ALPHA is zero the
+*>           values in A and B do not affect the result. This also means that
+*>           NaN/Inf propagation from A and B is inhibited if ALPHA is zero.
 *> \endverbatim
 *>
 *> \param[in] A
@@ -102,7 +117,10 @@
 *>           Before entry with  TRANSA = 'N' or 'n',  the leading  m by k
 *>           part of the array  A  must contain the matrix  A,  otherwise
 *>           the leading  k by m  part of the array  A  must contain  the
-*>           matrix A.
+*>           matrix A, except if ALPHA is zero.
+*>           If ALPHA is zero, none of the values in A affect the result, even
+*>           if they are NaN/Inf. This also implies that if ALPHA is zero,
+*>           the matrix elements of A need not be initialized by the caller.
 *> \endverbatim
 *>
 *> \param[in] LDA
@@ -121,7 +139,10 @@
 *>           Before entry with  TRANSB = 'N' or 'n',  the leading  k by n
 *>           part of the array  B  must contain the matrix  B,  otherwise
 *>           the leading  n by k  part of the array  B  must contain  the
-*>           matrix B.
+*>           matrix B, except if ALPHA is zero.
+*>           If ALPHA is zero, none of the values in B affect the result, even
+*>           if they are NaN/Inf. This also implies that if ALPHA is zero,
+*>           the matrix elements of B need not be initialized by the caller.
 *> \endverbatim
 *>
 *> \param[in] LDB
@@ -136,16 +157,19 @@
 *> \param[in] BETA
 *> \verbatim
 *>          BETA is COMPLEX
-*>           On entry,  BETA  specifies the scalar  beta.  When  BETA  is
-*>           supplied as zero then C need not be set on input.
+*>           On entry,  BETA  specifies the scalar  beta. If BETA is zero the
+*>           values in C do not affect the result. This also means that
+*>           NaN/Inf propagation from C is inhibited if BETA is zero.
 *> \endverbatim
 *>
 *> \param[in,out] C
 *> \verbatim
 *>          C is COMPLEX array, dimension ( LDC, N )
 *>           Before entry, the leading  m by n  part of the array  C must
-*>           contain the matrix  C,  except when  beta  is zero, in which
-*>           case C need not be set on entry.
+*>           contain the matrix  C, except if beta is zero.
+*>           If beta is zero, none of the values in C affect the result, even
+*>           if they are NaN/Inf. This also implies that if beta is zero,
+*>           the matrix elements of C need not be initialized by the caller.
 *>           On exit, the array  C  is overwritten by the  m by n  matrix
 *>           ( alpha*op( A )*op( B ) + beta*C ).
 *> \endverbatim
diff --git a/BLAS/SRC/dgemm.f b/BLAS/SRC/dgemm.f
index 1484b1900c..010a22d88e 100644
--- a/BLAS/SRC/dgemm.f
+++ b/BLAS/SRC/dgemm.f
@@ -35,6 +35,19 @@
 *>
 *> alpha and beta are scalars, and A, B and C are matrices, with op( A )
 *> an m by k matrix,  op( B )  a  k by n matrix and  C an m by n matrix.
+*>
+*> Note: if alpha and/or beta is zero, some parts of the matrix-matrix
+*>  operations are not performed. This results in the following NaN/Inf
+*>  propagation quirks:
+*>
+*>  1. If alpha is zero and beta is one, NaNs or Infs in A or B do not affect
+*>   the result.
+*>  2. If both alpha and beta are zero, then a zero matrix is returned in C,
+*>   irrespective of any NaNs or Infs in A, B or C.
+*>  3. If alpha is zero and beta is neither zero or one, then beta*C is
+*>   returned in C, irrespective of any NaNs or Infs in A or B.
+*>  4. If only beta is zero, alpha*op( A )*op( B ) is returned, irrespective
+*>   of any NaNs or Infs in C.
 *> \endverbatim
 *
 *  Arguments:
@@ -51,6 +64,9 @@
 *>              TRANSA = 'T' or 't',  op( A ) = A**T.
 *>
 *>              TRANSA = 'C' or 'c',  op( A ) = A**T.
+*>
+*>           Note: TRANSA = 'C' is supported for the sake of API consistency
+*>           between all ?GEMM variants.
 *> \endverbatim
 *>
 *> \param[in] TRANSB
@@ -64,6 +80,9 @@
 *>              TRANSB = 'T' or 't',  op( B ) = B**T.
 *>
 *>              TRANSB = 'C' or 'c',  op( B ) = B**T.
+*>
+*>           Note: TRANSB = 'C' is supported for the sake of API consistency
+*>           between all ?GEMM variants.
 *> \endverbatim
 *>
 *> \param[in] M
@@ -92,7 +111,9 @@
 *> \param[in] ALPHA
 *> \verbatim
 *>          ALPHA is DOUBLE PRECISION.
-*>           On entry, ALPHA specifies the scalar alpha.
+*>           On entry, ALPHA specifies the scalar alpha. If ALPHA is zero the
+*>           values in A and B do not affect the result. This also means that
+*>           NaN/Inf propagation from A and B is inhibited if ALPHA is zero.
 *> \endverbatim
 *>
 *> \param[in] A
@@ -102,7 +123,10 @@
 *>           Before entry with  TRANSA = 'N' or 'n',  the leading  m by k
 *>           part of the array  A  must contain the matrix  A,  otherwise
 *>           the leading  k by m  part of the array  A  must contain  the
-*>           matrix A.
+*>           matrix A, except if ALPHA is zero.
+*>           If ALPHA is zero, none of the values in A affect the result, even
+*>           if they are NaN/Inf. This also implies that if ALPHA is zero,
+*>           the matrix elements of A need not be initialized by the caller.
 *> \endverbatim
 *>
 *> \param[in] LDA
@@ -121,7 +145,10 @@
 *>           Before entry with  TRANSB = 'N' or 'n',  the leading  k by n
 *>           part of the array  B  must contain the matrix  B,  otherwise
 *>           the leading  n by k  part of the array  B  must contain  the
-*>           matrix B.
+*>           matrix B, except if ALPHA is zero.
+*>           If ALPHA is zero, none of the values in B affect the result, even
+*>           if they are NaN/Inf. This also implies that if ALPHA is zero,
+*>           the matrix elements of B need not be initialized by the caller.
 *> \endverbatim
 *>
 *> \param[in] LDB
@@ -136,16 +163,19 @@
 *> \param[in] BETA
 *> \verbatim
 *>          BETA is DOUBLE PRECISION.
-*>           On entry,  BETA  specifies the scalar  beta.  When  BETA  is
-*>           supplied as zero then C need not be set on input.
+*>           On entry,  BETA  specifies the scalar  beta.  If BETA is zero the
+*>           values in C do not affect the result. This also means that
+*>           NaN/Inf propagation from C is inhibited if BETA is zero.
 *> \endverbatim
 *>
 *> \param[in,out] C
 *> \verbatim
 *>          C is DOUBLE PRECISION array, dimension ( LDC, N )
 *>           Before entry, the leading  m by n  part of the array  C must
-*>           contain the matrix  C,  except when  beta  is zero, in which
-*>           case C need not be set on entry.
+*>           contain the matrix  C, except if beta is zero.
+*>           If beta is zero, none of the values in C affect the result, even
+*>           if they are NaN/Inf. This also implies that if beta is zero,
+*>           the matrix elements of C need not be initialized by the caller.
 *>           On exit, the array  C  is overwritten by the  m by n  matrix
 *>           ( alpha*op( A )*op( B ) + beta*C ).
 *> \endverbatim
diff --git a/BLAS/SRC/sgemm.f b/BLAS/SRC/sgemm.f
index 3e31add9fa..ed5f3d0a6a 100644
--- a/BLAS/SRC/sgemm.f
+++ b/BLAS/SRC/sgemm.f
@@ -35,6 +35,19 @@
 *>
 *> alpha and beta are scalars, and A, B and C are matrices, with op( A )
 *> an m by k matrix,  op( B )  a  k by n matrix and  C an m by n matrix.
+*>
+*> Note: if alpha and/or beta is zero, some parts of the matrix-matrix
+*>  operations are not performed. This results in the following NaN/Inf
+*>  propagation quirks:
+*>
+*>  1. If alpha is zero and beta is one, NaNs or Infs in A or B do not affect
+*>   the result.
+*>  2. If both alpha and beta are zero, then a zero matrix is returned in C,
+*>   irrespective of any NaNs or Infs in A, B or C.
+*>  3. If alpha is zero and beta is neither zero or one, then beta*C is
+*>   returned in C, irrespective of any NaNs or Infs in A or B.
+*>  4. If only beta is zero, alpha*op( A )*op( B ) is returned, irrespective
+*>   of any NaNs or Infs in C.
 *> \endverbatim
 *
 *  Arguments:
@@ -51,6 +64,9 @@
 *>              TRANSA = 'T' or 't',  op( A ) = A**T.
 *>
 *>              TRANSA = 'C' or 'c',  op( A ) = A**T.
+*>
+*>           Note: TRANSA = 'C' is supported for the sake of API consistency
+*>           between all ?GEMM variants.
 *> \endverbatim
 *>
 *> \param[in] TRANSB
@@ -64,6 +80,9 @@
 *>              TRANSB = 'T' or 't',  op( B ) = B**T.
 *>
 *>              TRANSB = 'C' or 'c',  op( B ) = B**T.
+*>
+*>           Note: TRANSB = 'C' is supported for the sake of API consistency
+*>           between all ?GEMM variants.
 *> \endverbatim
 *>
 *> \param[in] M
@@ -92,7 +111,9 @@
 *> \param[in] ALPHA
 *> \verbatim
 *>          ALPHA is REAL
-*>           On entry, ALPHA specifies the scalar alpha.
+*>           On entry, ALPHA specifies the scalar alpha. If ALPHA is zero the
+*>           values in A and B do not affect the result. This also means that
+*>           NaN/Inf propagation from A and B is inhibited if ALPHA is zero.
 *> \endverbatim
 *>
 *> \param[in] A
@@ -102,7 +123,10 @@
 *>           Before entry with  TRANSA = 'N' or 'n',  the leading  m by k
 *>           part of the array  A  must contain the matrix  A,  otherwise
 *>           the leading  k by m  part of the array  A  must contain  the
-*>           matrix A.
+*>           matrix A, except if ALPHA is zero.
+*>           If ALPHA is zero, none of the values in A affect the result, even
+*>           if they are NaN/Inf. This also implies that if ALPHA is zero,
+*>           the matrix elements of A need not be initialized by the caller.
 *> \endverbatim
 *>
 *> \param[in] LDA
@@ -121,7 +145,10 @@
 *>           Before entry with  TRANSB = 'N' or 'n',  the leading  k by n
 *>           part of the array  B  must contain the matrix  B,  otherwise
 *>           the leading  n by k  part of the array  B  must contain  the
-*>           matrix B.
+*>           matrix B, except if ALPHA is zero.
+*>           If ALPHA is zero, none of the values in B affect the result, even
+*>           if they are NaN/Inf. This also implies that if ALPHA is zero,
+*>           the matrix elements of B need not be initialized by the caller.
 *> \endverbatim
 *>
 *> \param[in] LDB
@@ -136,16 +163,19 @@
 *> \param[in] BETA
 *> \verbatim
 *>          BETA is REAL
-*>           On entry,  BETA  specifies the scalar  beta.  When  BETA  is
-*>           supplied as zero then C need not be set on input.
+*>           On entry,  BETA  specifies the scalar  beta.  If BETA is zero the
+*>           values in C do not affect the result. This also means that
+*>           NaN/Inf propagation from C is inhibited if BETA is zero.
 *> \endverbatim
 *>
 *> \param[in,out] C
 *> \verbatim
 *>          C is REAL array, dimension ( LDC, N )
 *>           Before entry, the leading  m by n  part of the array  C must
-*>           contain the matrix  C,  except when  beta  is zero, in which
-*>           case C need not be set on entry.
+*>           contain the matrix  C, except if beta is zero.
+*>           If beta is zero, none of the values in C affect the result, even
+*>           if they are NaN/Inf. This also implies that if beta is zero,
+*>           the matrix elements of C need not be initialized by the caller.
 *>           On exit, the array  C  is overwritten by the  m by n  matrix
 *>           ( alpha*op( A )*op( B ) + beta*C ).
 *> \endverbatim
diff --git a/BLAS/SRC/zgemm.f b/BLAS/SRC/zgemm.f
index 366119577f..9ad64f5ffa 100644
--- a/BLAS/SRC/zgemm.f
+++ b/BLAS/SRC/zgemm.f
@@ -35,6 +35,19 @@
 *>
 *> alpha and beta are scalars, and A, B and C are matrices, with op( A )
 *> an m by k matrix,  op( B )  a  k by n matrix and  C an m by n matrix.
+*>
+*> Note: if alpha and/or beta is zero, some parts of the matrix-matrix
+*>  operations are not performed. This results in the following NaN/Inf
+*>  propagation quirks:
+*>
+*>  1. If alpha is zero and beta is one, NaNs or Infs in A or B do not affect
+*>   the result.
+*>  2. If both alpha and beta are zero, then a zero matrix is returned in C,
+*>   irrespective of any NaNs or Infs in A, B or C.
+*>  3. If alpha is zero and beta is neither zero or one, then beta*C is
+*>   returned in C, irrespective of any NaNs or Infs in A or B.
+*>  4. If only beta is zero, alpha*op( A )*op( B ) is returned, irrespective
+*>   of any NaNs or Infs in C.
 *> \endverbatim
 *
 *  Arguments:
@@ -92,7 +105,9 @@
 *> \param[in] ALPHA
 *> \verbatim
 *>          ALPHA is COMPLEX*16
-*>           On entry, ALPHA specifies the scalar alpha.
+*>           On entry, ALPHA specifies the scalar alpha. If ALPHA is zero the
+*>           values in A and B do not affect the result. This also means that
+*>           NaN/Inf propagation from A and B is inhibited if ALPHA is zero.
 *> \endverbatim
 *>
 *> \param[in] A
@@ -102,7 +117,10 @@
 *>           Before entry with  TRANSA = 'N' or 'n',  the leading  m by k
 *>           part of the array  A  must contain the matrix  A,  otherwise
 *>           the leading  k by m  part of the array  A  must contain  the
-*>           matrix A.
+*>           matrix A, except if ALPHA is zero.
+*>           If ALPHA is zero, none of the values in A affect the result, even
+*>           if they are NaN/Inf. This also implies that if ALPHA is zero,
+*>           the matrix elements of A need not be initialized by the caller.
 *> \endverbatim
 *>
 *> \param[in] LDA
@@ -121,7 +139,10 @@
 *>           Before entry with  TRANSB = 'N' or 'n',  the leading  k by n
 *>           part of the array  B  must contain the matrix  B,  otherwise
 *>           the leading  n by k  part of the array  B  must contain  the
-*>           matrix B.
+*>           matrix B, except if ALPHA is zero.
+*>           If ALPHA is zero, none of the values in B affect the result, even
+*>           if they are NaN/Inf. This also implies that if ALPHA is zero,
+*>           the matrix elements of B need not be initialized by the caller.
 *> \endverbatim
 *>
 *> \param[in] LDB
@@ -136,16 +157,19 @@
 *> \param[in] BETA
 *> \verbatim
 *>          BETA is COMPLEX*16
-*>           On entry,  BETA  specifies the scalar  beta.  When  BETA  is
-*>           supplied as zero then C need not be set on input.
+*>           On entry,  BETA  specifies the scalar  beta. If BETA is zero the
+*>           values in C do not affect the result. This also means that
+*>           NaN/Inf propagation from C is inhibited if BETA is zero.
 *> \endverbatim
 *>
 *> \param[in,out] C
 *> \verbatim
 *>          C is COMPLEX*16 array, dimension ( LDC, N )
 *>           Before entry, the leading  m by n  part of the array  C must
-*>           contain the matrix  C,  except when  beta  is zero, in which
-*>           case C need not be set on entry.
+*>           contain the matrix  C,, except if beta is zero.
+*>           If beta is zero, none of the values in C affect the result, even
+*>           if they are NaN/Inf. This also implies that if beta is zero,
+*>           the matrix elements of C need not be initialized by the caller.
 *>           On exit, the array  C  is overwritten by the  m by n  matrix
 *>           ( alpha*op( A )*op( B ) + beta*C ).
 *> \endverbatim

From 5f79137150a0a3941bd876432c25aad3d4e25cb6 Mon Sep 17 00:00:00 2001
From: GYT <tiborgyri@gmail.com>
Date: Sun, 19 Jan 2025 15:57:34 +0100
Subject: [PATCH 2/2] simplify nan propagation quirks in the purpose section

---
 BLAS/SRC/cgemm.f | 7 ++-----
 BLAS/SRC/dgemm.f | 7 ++-----
 BLAS/SRC/sgemm.f | 7 ++-----
 BLAS/SRC/zgemm.f | 7 ++-----
 4 files changed, 8 insertions(+), 20 deletions(-)

diff --git a/BLAS/SRC/cgemm.f b/BLAS/SRC/cgemm.f
index 103466fadb..7e7965a50c 100644
--- a/BLAS/SRC/cgemm.f
+++ b/BLAS/SRC/cgemm.f
@@ -40,13 +40,10 @@
 *>  operations are not performed. This results in the following NaN/Inf
 *>  propagation quirks:
 *>
-*>  1. If alpha is zero and beta is one, NaNs or Infs in A or B do not affect
-*>   the result.
+*>  1. If alpha is zero, NaNs or Infs in A or B do not affect the result.
 *>  2. If both alpha and beta are zero, then a zero matrix is returned in C,
 *>   irrespective of any NaNs or Infs in A, B or C.
-*>  3. If alpha is zero and beta is neither zero or one, then beta*C is
-*>   returned in C, irrespective of any NaNs or Infs in A or B.
-*>  4. If only beta is zero, alpha*op( A )*op( B ) is returned, irrespective
+*>  3. If only beta is zero, alpha*op( A )*op( B ) is returned, irrespective
 *>   of any NaNs or Infs in C.
 *> \endverbatim
 *
diff --git a/BLAS/SRC/dgemm.f b/BLAS/SRC/dgemm.f
index 010a22d88e..f2a7af4fb3 100644
--- a/BLAS/SRC/dgemm.f
+++ b/BLAS/SRC/dgemm.f
@@ -40,13 +40,10 @@
 *>  operations are not performed. This results in the following NaN/Inf
 *>  propagation quirks:
 *>
-*>  1. If alpha is zero and beta is one, NaNs or Infs in A or B do not affect
-*>   the result.
+*>  1. If alpha is zero, NaNs or Infs in A or B do not affect the result.
 *>  2. If both alpha and beta are zero, then a zero matrix is returned in C,
 *>   irrespective of any NaNs or Infs in A, B or C.
-*>  3. If alpha is zero and beta is neither zero or one, then beta*C is
-*>   returned in C, irrespective of any NaNs or Infs in A or B.
-*>  4. If only beta is zero, alpha*op( A )*op( B ) is returned, irrespective
+*>  3. If only beta is zero, alpha*op( A )*op( B ) is returned, irrespective
 *>   of any NaNs or Infs in C.
 *> \endverbatim
 *
diff --git a/BLAS/SRC/sgemm.f b/BLAS/SRC/sgemm.f
index ed5f3d0a6a..a93f44f284 100644
--- a/BLAS/SRC/sgemm.f
+++ b/BLAS/SRC/sgemm.f
@@ -40,13 +40,10 @@
 *>  operations are not performed. This results in the following NaN/Inf
 *>  propagation quirks:
 *>
-*>  1. If alpha is zero and beta is one, NaNs or Infs in A or B do not affect
-*>   the result.
+*>  1. If alpha is zero, NaNs or Infs in A or B do not affect the result.
 *>  2. If both alpha and beta are zero, then a zero matrix is returned in C,
 *>   irrespective of any NaNs or Infs in A, B or C.
-*>  3. If alpha is zero and beta is neither zero or one, then beta*C is
-*>   returned in C, irrespective of any NaNs or Infs in A or B.
-*>  4. If only beta is zero, alpha*op( A )*op( B ) is returned, irrespective
+*>  3. If only beta is zero, alpha*op( A )*op( B ) is returned, irrespective
 *>   of any NaNs or Infs in C.
 *> \endverbatim
 *
diff --git a/BLAS/SRC/zgemm.f b/BLAS/SRC/zgemm.f
index 9ad64f5ffa..a33a00ce8b 100644
--- a/BLAS/SRC/zgemm.f
+++ b/BLAS/SRC/zgemm.f
@@ -40,13 +40,10 @@
 *>  operations are not performed. This results in the following NaN/Inf
 *>  propagation quirks:
 *>
-*>  1. If alpha is zero and beta is one, NaNs or Infs in A or B do not affect
-*>   the result.
+*>  1. If alpha is zero, NaNs or Infs in A or B do not affect the result.
 *>  2. If both alpha and beta are zero, then a zero matrix is returned in C,
 *>   irrespective of any NaNs or Infs in A, B or C.
-*>  3. If alpha is zero and beta is neither zero or one, then beta*C is
-*>   returned in C, irrespective of any NaNs or Infs in A or B.
-*>  4. If only beta is zero, alpha*op( A )*op( B ) is returned, irrespective
+*>  3. If only beta is zero, alpha*op( A )*op( B ) is returned, irrespective
 *>   of any NaNs or Infs in C.
 *> \endverbatim
 *