@@ -459,9 +459,9 @@ void sgemm_4x16_pack_A_n(float * outptr, const float * inptr, int ldin, int y0, | |||
switch ((y + 3) - ymax) { | |||
/* Everything falls through in here */ | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -478,9 +478,9 @@ void sgemm_4x16_pack_A_n(float * outptr, const float * inptr, int ldin, int y0, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -676,9 +676,9 @@ void sgemm_4x16_pack_B_t(float* out, const float* in, int ldin, | |||
switch ((y + 3) - ymax) { | |||
/* Everything falls through in here */ | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -696,9 +696,9 @@ void sgemm_4x16_pack_B_t(float* out, const float* in, int ldin, | |||
switch ((y + 3) - ymax) { | |||
/* Everything falls through in here */ | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -964,9 +964,9 @@ void sgemm_8x12_pack_A_n(float* outptr, const float* inptr, int ldin, int y0, | |||
switch ((y + 3) - ymax) { | |||
/* Everything falls through in here */ | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -983,9 +983,9 @@ void sgemm_8x12_pack_A_n(float* outptr, const float* inptr, int ldin, int y0, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -1204,9 +1204,9 @@ void sgemm_8x12_pack_B_t(float* out, const float* in, int ldin, | |||
switch ((y + 3) - ymax) { | |||
/* Everything falls through in here */ | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -1224,9 +1224,9 @@ void sgemm_8x12_pack_B_t(float* out, const float* in, int ldin, | |||
switch ((y + 3) - ymax) { | |||
/* Everything falls through in here */ | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -975,9 +975,9 @@ static void gemm_s16_12x8x1_pack_A_n(int16_t* outptr, const int16_t* inptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -992,9 +992,9 @@ static void gemm_s16_12x8x1_pack_A_n(int16_t* outptr, const int16_t* inptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -1136,9 +1136,9 @@ static void gemm_s16_12x8x1_transpose_pack_B_n(int16_t* outptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -1153,9 +1153,9 @@ static void gemm_s16_12x8x1_transpose_pack_B_n(int16_t* outptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -717,9 +717,9 @@ static void gemm_s8_4x4_pack_A_n(dt_int8* outptr, const dt_int8* inptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -735,9 +735,9 @@ static void gemm_s8_4x4_pack_A_n(dt_int8* outptr, const dt_int8* inptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -778,19 +778,19 @@ static void gemm_s8_4x4_pack_B_n(dt_int8* out, const dt_int8* in, int ldin, | |||
if (remain >= 0) { | |||
switch (remain) { | |||
case 7: | |||
inptr0 = zerobuff; | |||
inptr0 = zerobuff; MEGDNN_FALLTHRU | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -809,19 +809,19 @@ static void gemm_s8_4x4_pack_B_n(dt_int8* out, const dt_int8* in, int ldin, | |||
if (remain >= 0) { | |||
switch (remain) { | |||
case 7: | |||
inptr0 = zerobuff; | |||
inptr0 = zerobuff; MEGDNN_FALLTHRU | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -992,9 +992,9 @@ static void gemm_s8_8x8_pack_A_n(int8_t* outptr, const int8_t* inptr, int ldin, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -1010,9 +1010,9 @@ static void gemm_s8_8x8_pack_A_n(int8_t* outptr, const int8_t* inptr, int ldin, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -1064,17 +1064,17 @@ static void gemm_s8_8x8_transpose_pack_A_n(int8_t* out, const int8_t* in, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1092,17 +1092,17 @@ static void gemm_s8_8x8_transpose_pack_A_n(int8_t* out, const int8_t* in, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1120,17 +1120,17 @@ static void gemm_s8_8x8_transpose_pack_A_n(int8_t* out, const int8_t* in, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1187,17 +1187,17 @@ static void gemm_s8_8x8_pack_B_n(int8_t* out, const int8_t* in, int ldin, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1216,17 +1216,17 @@ static void gemm_s8_8x8_pack_B_n(int8_t* out, const int8_t* in, int ldin, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1245,17 +1245,17 @@ static void gemm_s8_8x8_pack_B_n(int8_t* out, const int8_t* in, int ldin, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1332,9 +1332,9 @@ static void gemm_s8_8x8_transpose_pack_B_n(int8_t* outptr, const int8_t* inptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -1351,9 +1351,9 @@ static void gemm_s8_8x8_transpose_pack_B_n(int8_t* outptr, const int8_t* inptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -846,9 +846,9 @@ static void gemm_mk4_s8_4x4_pack_B(dt_int8* out, const dt_int8* in, int ldin, | |||
if (k + 3 >= ICB) { | |||
switch (k + 3 - ICB) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -863,9 +863,9 @@ static void gemm_mk4_s8_4x4_pack_B(dt_int8* out, const dt_int8* in, int ldin, | |||
if (k + 3 >= ICB) { | |||
switch (k + 3 - ICB) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -292,9 +292,9 @@ static void gemm_s8x8x16_4x4_pack_A_n(dt_int8* outptr, const dt_int8* inptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -309,9 +309,9 @@ static void gemm_s8x8x16_4x4_pack_A_n(dt_int8* outptr, const dt_int8* inptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -362,19 +362,19 @@ static void gemm_s8x8x16_4x4_pack_B_n(dt_int8* out, const dt_int8* in, int ldin, | |||
if (remain >= 0) { | |||
switch (remain) { | |||
case 7: | |||
inptr0 = zerobuff; | |||
inptr0 = zerobuff; MEGDNN_FALLTHRU | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -393,19 +393,19 @@ static void gemm_s8x8x16_4x4_pack_B_n(dt_int8* out, const dt_int8* in, int ldin, | |||
if (remain >= 0) { | |||
switch (remain) { | |||
case 7: | |||
inptr0 = zerobuff; | |||
inptr0 = zerobuff; MEGDNN_FALLTHRU | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -918,9 +918,9 @@ static void gemm_s8x8x16_8x8_pack_A_n(dt_int8* outptr, const dt_int8* inptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -936,9 +936,9 @@ static void gemm_s8x8x16_8x8_pack_A_n(dt_int8* outptr, const dt_int8* inptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -991,17 +991,17 @@ static void gemm_s8x8x16_8x8_transpose_pack_A_n(dt_int8* out, const dt_int8* in, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1019,17 +1019,17 @@ static void gemm_s8x8x16_8x8_transpose_pack_A_n(dt_int8* out, const dt_int8* in, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1047,17 +1047,17 @@ static void gemm_s8x8x16_8x8_transpose_pack_A_n(dt_int8* out, const dt_int8* in, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1113,17 +1113,17 @@ static void gemm_s8x8x16_8x8_pack_B_n(dt_int8* out, const dt_int8* in, int ldin, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1142,17 +1142,17 @@ static void gemm_s8x8x16_8x8_pack_B_n(dt_int8* out, const dt_int8* in, int ldin, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1171,17 +1171,17 @@ static void gemm_s8x8x16_8x8_pack_B_n(dt_int8* out, const dt_int8* in, int ldin, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1259,9 +1259,9 @@ static void gemm_s8x8x16_8x8_transpose_pack_B_n(dt_int8* outptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -1278,9 +1278,9 @@ static void gemm_s8x8x16_8x8_transpose_pack_B_n(dt_int8* outptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -1011,9 +1011,9 @@ static void gemm_u8_8x8_pack_A_n(dt_uint8* outptr, const dt_uint8* inptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -1029,9 +1029,9 @@ static void gemm_u8_8x8_pack_A_n(dt_uint8* outptr, const dt_uint8* inptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -1084,17 +1084,17 @@ static void gemm_u8_8x8_transpose_pack_A_n(dt_uint8* out, const dt_uint8* in, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1112,17 +1112,17 @@ static void gemm_u8_8x8_transpose_pack_A_n(dt_uint8* out, const dt_uint8* in, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1140,17 +1140,17 @@ static void gemm_u8_8x8_transpose_pack_A_n(dt_uint8* out, const dt_uint8* in, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1208,17 +1208,17 @@ static void gemm_u8_8x8_pack_B_n(dt_uint8* out, const dt_uint8* in, int ldin, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1237,17 +1237,17 @@ static void gemm_u8_8x8_pack_B_n(dt_uint8* out, const dt_uint8* in, int ldin, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1266,17 +1266,17 @@ static void gemm_u8_8x8_pack_B_n(dt_uint8* out, const dt_uint8* in, int ldin, | |||
if (k + 7 >= kmax) { | |||
switch (k + 7 - kmax) { | |||
case 6: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 5: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 4: | |||
inptr3 = zerobuff; | |||
inptr3 = zerobuff; MEGDNN_FALLTHRU | |||
case 3: | |||
inptr4 = zerobuff; | |||
inptr4 = zerobuff; MEGDNN_FALLTHRU | |||
case 2: | |||
inptr5 = zerobuff; | |||
inptr5 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr6 = zerobuff; | |||
inptr6 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr7 = zerobuff; | |||
break; | |||
@@ -1354,9 +1354,9 @@ static void gemm_u8_8x8_transpose_pack_B_n(dt_uint8* outptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -1373,9 +1373,9 @@ static void gemm_u8_8x8_transpose_pack_B_n(dt_uint8* outptr, | |||
if (y + 3 >= ymax) { | |||
switch (y + 3 - ymax) { | |||
case 2: | |||
inptr1 = zerobuff; | |||
inptr1 = zerobuff; MEGDNN_FALLTHRU | |||
case 1: | |||
inptr2 = zerobuff; | |||
inptr2 = zerobuff; MEGDNN_FALLTHRU | |||
case 0: | |||
inptr3 = zerobuff; | |||
break; | |||
@@ -27,9 +27,9 @@ namespace arm_common { | |||
vreinterpret_s32_s8(vres), idx / 4); \ | |||
break; \ | |||
case 3: \ | |||
vst1_lane_s8(C + 2, vres, idx + 2); \ | |||
vst1_lane_s8(C + 2, vres, idx + 2); MEGDNN_FALLTHRU\ | |||
case 2: \ | |||
vst1_lane_s8(C + 1, vres, idx + 1); \ | |||
vst1_lane_s8(C + 1, vres, idx + 1); MEGDNN_FALLTHRU\ | |||
case 1: \ | |||
vst1_lane_s8(C + 0, vres, idx + 0); \ | |||
break; \ | |||
@@ -44,9 +44,9 @@ namespace arm_common { | |||
vreinterpret_s32_u8(vres), idx / 4); \ | |||
break; \ | |||
case 3: \ | |||
vst1_lane_u8(C + 2, vres, idx + 2); \ | |||
vst1_lane_u8(C + 2, vres, idx + 2); MEGDNN_FALLTHRU\ | |||
case 2: \ | |||
vst1_lane_u8(C + 1, vres, idx + 1); \ | |||
vst1_lane_u8(C + 1, vres, idx + 1); MEGDNN_FALLTHRU\ | |||
case 1: \ | |||
vst1_lane_u8(C + 0, vres, idx + 0); \ | |||
break; \ | |||