Skip to content

Commit

Permalink
sbgemm: spr: tuning for blocking params
Browse files Browse the repository at this point in the history
  • Loading branch information
guowangy committed Oct 18, 2021
1 parent a70bfb5 commit 0abbcd1
Showing 1 changed file with 14 additions and 0 deletions.
14 changes: 14 additions & 0 deletions param.h
Expand Up @@ -1771,6 +1771,20 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
#endif
#define USE_SGEMM_KERNEL_DIRECT 1

// SBGEMM parameters: each macro is first undefined, discarding any earlier
// definition, and then redefined with the value used from here on.

// FIXME: the actual unroll factors are UNROLL_M = UNROLL_N = 16.
// When M and N are equal, OpenBLAS reuses OCOPY as ICOPY. For AMX the two
// are not the same, so UNROLL_M is set to 32 as a workaround.
#undef  SBGEMM_DEFAULT_UNROLL_M
#define SBGEMM_DEFAULT_UNROLL_M 32

#undef  SBGEMM_DEFAULT_UNROLL_N
#define SBGEMM_DEFAULT_UNROLL_N 16

#undef  SBGEMM_DEFAULT_P
#define SBGEMM_DEFAULT_P 192

#undef  SBGEMM_DEFAULT_Q
#define SBGEMM_DEFAULT_Q 1024

// Not a literal: expands to the identifier sbgemm_r, which must be provided
// elsewhere wherever this macro is used.
#undef  SBGEMM_DEFAULT_R
#define SBGEMM_DEFAULT_R sbgemm_r

#ifdef ARCH_X86

#define SGEMM_DEFAULT_UNROLL_M 4
Expand Down

0 comments on commit 0abbcd1

Please sign in to comment.