Skip to content

Commit

Permalink
Merge pull request #3399 from martin-frbg/issue2814
Browse files Browse the repository at this point in the history
Improve performance on Apple M1 Vortex
  • Loading branch information
martin-frbg committed Oct 7, 2021
2 parents 8e4c209 + 24233b7 commit b54b50f
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 3 deletions.
2 changes: 1 addition & 1 deletion kernel/arm64/KERNEL.VORTEX
@@ -1 +1 @@
-include $(KERNELDIR)/KERNEL.ARMV8
+include $(KERNELDIR)/KERNEL.NEOVERSEN1
4 changes: 2 additions & 2 deletions param.h
Expand Up @@ -2972,7 +2972,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

#if defined(CORTEXA57) || \
defined(CORTEXA72) || defined(CORTEXA73) || \
-defined(FALKOR) || defined(TSV110) || defined(EMAG8180)
+defined(FALKOR) || defined(TSV110) || defined(EMAG8180) || defined(VORTEX)

#define SGEMM_DEFAULT_UNROLL_M 16
#define SGEMM_DEFAULT_UNROLL_N 4
Expand All @@ -2989,7 +2989,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
/*FIXME: this should be using the cache size, but there is currently no easy way to
query that on ARM. So if getarch counted more than 8 cores we simply assume the host
is a big desktop or server with abundant cache rather than a phone or embedded device */
-#if NUM_CORES > 8 || defined(TSV110) || defined(EMAG8180)
+#if NUM_CORES > 8 || defined(TSV110) || defined(EMAG8180) || defined(VORTEX)
#define SGEMM_DEFAULT_P 512
#define DGEMM_DEFAULT_P 256
#define CGEMM_DEFAULT_P 256
Expand Down

0 comments on commit b54b50f

Please sign in to comment.