summary refs log tree commit diff stats
diff options
context:
space:
mode:
author Miao Wang <miaowang@google.com> 2015-06-29 17:29:43 -0700
committer Miao Wang <miaowang@google.com> 2015-06-30 16:28:46 -0700
commit 22cb808b0dfc9bd514d2e19b302a97f8455b5731 (patch)
tree 2aa46f542560006777eb5ca68a338e7295d35559
parent 7427a2546ecfa904cb4e580981f0419c628fc416 (diff)
download android_frameworks_rs-22cb808b0dfc9bd514d2e19b302a97f8455b5731.tar.gz
android_frameworks_rs-22cb808b0dfc9bd514d2e19b302a97f8455b5731.tar.bz2
android_frameworks_rs-22cb808b0dfc9bd514d2e19b302a97f8455b5731.zip
update the offset type for BLAS.BNNM
bug: 22184114
Change-Id: I6ec212f8d5feb46fc9d0f97862b206978af1675b
-rw-r--r-- cpu_ref/rsCpuIntrinsicBLAS.cpp 16
-rw-r--r-- rsDefines.h 8
2 files changed, 12 insertions, 12 deletions
diff --git a/cpu_ref/rsCpuIntrinsicBLAS.cpp b/cpu_ref/rsCpuIntrinsicBLAS.cpp
index 30344544..a7705b4e 100644
--- a/cpu_ref/rsCpuIntrinsicBLAS.cpp
+++ b/cpu_ref/rsCpuIntrinsicBLAS.cpp
@@ -47,10 +47,10 @@ protected:
uint8_t c_offset = 0;
static void kernelBNNM(size_t m, size_t n, size_t k,
- const uint8_t* a, uint32_t a_offset, size_t lda,
- const uint8_t* b, uint32_t b_offset, size_t ldb,
- uint8_t* c, uint32_t c_offset, size_t ldc,
- uint32_t c_mult_int);
+ const uint8_t* a, uint8_t a_offset, size_t lda,
+ const uint8_t* b, uint8_t b_offset, size_t ldb,
+ uint8_t* c, int32_t c_offset, size_t ldc,
+ int32_t c_mult_int);
@@ -653,10 +653,10 @@ void RsdCpuScriptIntrinsicBLAS::invokeForEach(uint32_t slot,
}
void RsdCpuScriptIntrinsicBLAS::kernelBNNM(size_t m, size_t n, size_t k,
- const uint8_t* a, uint32_t a_offset, size_t lda,
- const uint8_t* b, uint32_t b_offset, size_t ldb,
- uint8_t* c, uint32_t c_offset, size_t ldc,
- uint32_t c_mult_int) {
+ const uint8_t* a, uint8_t a_offset, size_t lda,
+ const uint8_t* b, uint8_t b_offset, size_t ldb,
+ uint8_t* c, int32_t c_offset, size_t ldc,
+ int32_t c_mult_int) {
// Calculations are done in 1.10.21 fixed-point format for the final output,
// just before there's a shift down to drop the fractional parts. The output
// values are gated to 0 to 255 to fit in a byte, but the 10-bit format
diff --git a/rsDefines.h b/rsDefines.h
index e00ddc19..4edda7af 100644
--- a/rsDefines.h
+++ b/rsDefines.h
@@ -460,10 +460,10 @@ typedef struct {
int incY;
int KL;
int KU;
- uint32_t a_offset;
- uint32_t b_offset;
- uint32_t c_offset;
- uint32_t c_mult_int;
+ uint8_t a_offset;
+ uint8_t b_offset;
+ int32_t c_offset;
+ int32_t c_mult_int;
} RsBlasCall;
enum RsGlobalProperty {