Add explicit (FLOAT) casts to the constants compared against beta.
This commit is contained in:
parent
7ec3c16d82
commit
915a6d6e44
|
@ -121,12 +121,12 @@ FORCEINLINE void copy_x(BLASLONG n, IFLOAT *src, IFLOAT *dest, BLASLONG inc_src)
|
||||||
|
|
||||||
FORCEINLINE void copy_y_beta(BLASLONG n, FLOAT *src, FLOAT *dest, BLASLONG inc_src, FLOAT beta)
|
FORCEINLINE void copy_y_beta(BLASLONG n, FLOAT *src, FLOAT *dest, BLASLONG inc_src, FLOAT beta)
|
||||||
{
|
{
|
||||||
if (beta == 0) {
|
if (beta == (FLOAT)0) {
|
||||||
for (BLASLONG i = 0; i < n; i++) {
|
for (BLASLONG i = 0; i < n; i++) {
|
||||||
*dest++ = (FLOAT)0;
|
*dest++ = (FLOAT)0;
|
||||||
src += inc_src;
|
src += inc_src;
|
||||||
}
|
}
|
||||||
} else if (beta == 1) {
|
} else if (beta == (FLOAT)1) {
|
||||||
for (BLASLONG i = 0; i < n; i++) {
|
for (BLASLONG i = 0; i < n; i++) {
|
||||||
*dest++ = *src;
|
*dest++ = *src;
|
||||||
src += inc_src;
|
src += inc_src;
|
||||||
|
@ -141,12 +141,12 @@ FORCEINLINE void copy_y_beta(BLASLONG n, FLOAT *src, FLOAT *dest, BLASLONG inc_s
|
||||||
|
|
||||||
FORCEINLINE void copy_y(BLASLONG n, FLOAT *src, FLOAT *dest, BLASLONG inc_src, FLOAT beta)
|
FORCEINLINE void copy_y(BLASLONG n, FLOAT *src, FLOAT *dest, BLASLONG inc_src, FLOAT beta)
|
||||||
{
|
{
|
||||||
if (beta == 0) {
|
if (beta == (FLOAT)0) {
|
||||||
for (BLASLONG i = 0; i < n; i++) {
|
for (BLASLONG i = 0; i < n; i++) {
|
||||||
*dest = *src++;
|
*dest = *src++;
|
||||||
dest += inc_src;
|
dest += inc_src;
|
||||||
}
|
}
|
||||||
} else if (beta == 1) {
|
} else if (beta == (FLOAT)1) {
|
||||||
for (BLASLONG i = 0; i < n; i++) {
|
for (BLASLONG i = 0; i < n; i++) {
|
||||||
*dest += *src++;
|
*dest += *src++;
|
||||||
dest += inc_src;
|
dest += inc_src;
|
||||||
|
@ -169,9 +169,9 @@ FORCEINLINE void move_y(BLASLONG n, FLOAT *src, FLOAT *dest, BLASLONG inc_dest)
|
||||||
|
|
||||||
static void BF16GEMV_N_beta(BLASLONG n, FLOAT *output_vector, FLOAT *input_vector, FLOAT beta)
|
static void BF16GEMV_N_beta(BLASLONG n, FLOAT *output_vector, FLOAT *input_vector, FLOAT beta)
|
||||||
{
|
{
|
||||||
if (beta == 0) {
|
if (beta == (FLOAT)0) {
|
||||||
memset(output_vector, 0, sizeof(FLOAT) * n);
|
memset(output_vector, 0, sizeof(FLOAT) * n);
|
||||||
} else if (beta == 1) {
|
} else if (beta == (FLOAT)1) {
|
||||||
if (output_vector != input_vector) {
|
if (output_vector != input_vector) {
|
||||||
memcpy(output_vector, input_vector, sizeof(FLOAT) * n);
|
memcpy(output_vector, input_vector, sizeof(FLOAT) * n);
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue