sbgemm: spr: enlarge P to 256 for performance
author: Wangyang Guo <wangyang.guo@intel.com>
Thu, 16 Sep 2021 03:29:49 +0000 (20:29 -0700)
committer: Wangyang Guo <wangyang.guo@intel.com>
Mon, 18 Oct 2021 02:08:03 +0000 (19:08 -0700)
param.h

diff --git a/param.h b/param.h
index c2c6916..23f406d 100644 (file)
--- a/param.h
+++ b/param.h
@@ -1781,7 +1781,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 // But for AMX, they are not the same, set UNROLL_M = 32 to workaround
 #define SBGEMM_DEFAULT_UNROLL_N 16
 #define SBGEMM_DEFAULT_UNROLL_M 32
-#define SBGEMM_DEFAULT_P 192
+#define SBGEMM_DEFAULT_P 256
 #define SBGEMM_DEFAULT_Q 1024
 #define SBGEMM_DEFAULT_R sbgemm_r