Special case for alpha=1 in saxpy, slight performance increase.

This commit is contained in:
Tomasz Sobczyk
2020-11-25 22:13:11 +01:00
committed by nodchip
parent 49b2dcb1f3
commit 8009973381

View File

@@ -177,10 +177,19 @@ namespace Blas {
float * SF_BLAS_RESTRICT Y
)
{
for(int i = 0; i < N; ++i)
if (alpha == 1.0f)
{
Y[i] += X[i] * alpha;
for (int i = 0; i < N; ++i)
{
Y[i] += X[i];
}
}
else
{
for (int i = 0; i < N; ++i)
{
Y[i] += X[i] * alpha;
}
}
}