diff options
-rw-r--r-- | cpu_ref/rsCpuIntrinsicBLAS.cpp | 16 | ||||
-rw-r--r-- | rsDefines.h | 8 |
2 files changed, 12 insertions, 12 deletions
diff --git a/cpu_ref/rsCpuIntrinsicBLAS.cpp b/cpu_ref/rsCpuIntrinsicBLAS.cpp index 30344544..a7705b4e 100644 --- a/cpu_ref/rsCpuIntrinsicBLAS.cpp +++ b/cpu_ref/rsCpuIntrinsicBLAS.cpp @@ -47,10 +47,10 @@ protected: uint8_t c_offset = 0; static void kernelBNNM(size_t m, size_t n, size_t k, - const uint8_t* a, uint32_t a_offset, size_t lda, - const uint8_t* b, uint32_t b_offset, size_t ldb, - uint8_t* c, uint32_t c_offset, size_t ldc, - uint32_t c_mult_int); + const uint8_t* a, uint8_t a_offset, size_t lda, + const uint8_t* b, uint8_t b_offset, size_t ldb, + uint8_t* c, int32_t c_offset, size_t ldc, + int32_t c_mult_int); @@ -653,10 +653,10 @@ void RsdCpuScriptIntrinsicBLAS::invokeForEach(uint32_t slot, } void RsdCpuScriptIntrinsicBLAS::kernelBNNM(size_t m, size_t n, size_t k, - const uint8_t* a, uint32_t a_offset, size_t lda, - const uint8_t* b, uint32_t b_offset, size_t ldb, - uint8_t* c, uint32_t c_offset, size_t ldc, - uint32_t c_mult_int) { + const uint8_t* a, uint8_t a_offset, size_t lda, + const uint8_t* b, uint8_t b_offset, size_t ldb, + uint8_t* c, int32_t c_offset, size_t ldc, + int32_t c_mult_int) { // Calculations are done in 1.10.21 fixed-point format for the final output, // just before there's a shift down to drop the fractional parts. The output // values are gated to 0 to 255 to fit in a byte, but the 10-bit format diff --git a/rsDefines.h b/rsDefines.h index e00ddc19..4edda7af 100644 --- a/rsDefines.h +++ b/rsDefines.h @@ -460,10 +460,10 @@ typedef struct { int incY; int KL; int KU; - uint32_t a_offset; - uint32_t b_offset; - uint32_t c_offset; - uint32_t c_mult_int; + uint8_t a_offset; + uint8_t b_offset; + int32_t c_offset; + int32_t c_mult_int; } RsBlasCall; enum RsGlobalProperty { |