-
Notifications
You must be signed in to change notification settings - Fork 724
/
patch-libs_ardour_sse__functions__avx__linux.cc
84 lines (84 loc) · 4 KB
/
patch-libs_ardour_sse__functions__avx__linux.cc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
--- libs/ardour/sse_functions_avx_linux.cc.orig 2023-02-21 01:17:58 UTC
+++ libs/ardour/sse_functions_avx_linux.cc
@@ -106,7 +106,7 @@ x86_sse_avx_compute_peak(const float *src, uint32_t nf
while (nframes >= 32)
{
#ifdef _WIN32
- _mm_prefetch(reinterpret_cast<char const *>(src + 32), _mm_hint(0));
+ _mm_prefetch(reinterpret_cast<char const *>(src + 32), _MM_HINT_NTA);
#else
__builtin_prefetch(reinterpret_cast<void const *>(src + 32), 0, 0);
#endif
@@ -196,7 +196,7 @@ x86_sse_avx_find_peaks(const float *src, uint32_t nfra
while (nframes >= 32)
{
#ifdef _WIN32
- _mm_prefetch(reinterpret_cast<char const *>(src + 32), _mm_hint(0));
+ _mm_prefetch(reinterpret_cast<char const *>(src + 32), _MM_HINT_NTA);
#else
__builtin_prefetch(reinterpret_cast<void const *>(src + 32), 0, 0);
#endif
@@ -278,7 +278,7 @@ x86_sse_avx_apply_gain_to_buffer(float *dst, uint32_t
while (frames >= 16)
{
#if defined(COMPILER_MSVC) || defined(COMPILER_MINGW)
- _mm_prefetch(((char *)dst + (16 * sizeof(float))), _mm_hint(0));
+ _mm_prefetch(((char *)dst + (16 * sizeof(float))), _MM_HINT_NTA);
#else
__builtin_prefetch(reinterpret_cast<void const *>(dst + 16), 0, 0);
#endif
@@ -410,8 +410,8 @@ x86_sse_avx_mix_buffers_with_gain_unaligned(float *dst
while (nframes >= 16)
{
#if defined(COMPILER_MSVC) || defined(COMPILER_MINGW)
- _mm_prefetch(((char *)dst + (16 * sizeof(float))), _mm_hint(0));
- _mm_prefetch(((char *)src + (16 * sizeof(float))), _mm_hint(0));
+ _mm_prefetch(((char *)dst + (16 * sizeof(float))), _MM_HINT_NTA);
+ _mm_prefetch(((char *)src + (16 * sizeof(float))), _MM_HINT_NTA);
#else
__builtin_prefetch(reinterpret_cast<void const *>(src + 16), 0, 0);
__builtin_prefetch(reinterpret_cast<void const *>(dst + 16), 0, 0);
@@ -503,8 +503,8 @@ x86_sse_avx_mix_buffers_with_gain_aligned(float *dst,
while (nframes >= 16)
{
#if defined(COMPILER_MSVC) || defined(COMPILER_MINGW)
- _mm_prefetch(((char *)dst + (16 * sizeof(float))), _mm_hint(0));
- _mm_prefetch(((char *)src + (16 * sizeof(float))), _mm_hint(0));
+ _mm_prefetch(((char *)dst + (16 * sizeof(float))), _MM_HINT_NTA);
+ _mm_prefetch(((char *)src + (16 * sizeof(float))), _MM_HINT_NTA);
#else
__builtin_prefetch(reinterpret_cast<void const *>(src + 16), 0, 0);
__builtin_prefetch(reinterpret_cast<void const *>(dst + 16), 0, 0);
@@ -592,8 +592,8 @@ x86_sse_avx_mix_buffers_no_gain_unaligned(float *dst,
while (nframes >= 16)
{
#if defined(COMPILER_MSVC) || defined(COMPILER_MINGW)
- _mm_prefetch(((char *)dst + (16 * sizeof(float))), _mm_hint(0));
- _mm_prefetch(((char *)src + (16 * sizeof(float))), _mm_hint(0));
+ _mm_prefetch(((char *)dst + (16 * sizeof(float))), _MM_HINT_NTA);
+ _mm_prefetch(((char *)src + (16 * sizeof(float))), _MM_HINT_NTA);
#else
__builtin_prefetch(reinterpret_cast<void const *>(src + 16), 0, 0);
__builtin_prefetch(reinterpret_cast<void const *>(dst + 16), 0, 0);
@@ -674,8 +674,8 @@ x86_sse_avx_mix_buffers_no_gain_aligned(float *dst, co
while (nframes >= 32)
{
#if defined(COMPILER_MSVC) || defined(COMPILER_MINGW)
- _mm_prefetch(((char *)dst + (32 * sizeof(float))), _mm_hint(0));
- _mm_prefetch(((char *)src + (32 * sizeof(float))), _mm_hint(0));
+ _mm_prefetch(((char *)dst + (32 * sizeof(float))), _MM_HINT_NTA);
+ _mm_prefetch(((char *)src + (32 * sizeof(float))), _MM_HINT_NTA);
#else
__builtin_prefetch(reinterpret_cast<void const *>(src + 32), 0, 0);
__builtin_prefetch(reinterpret_cast<void const *>(dst + 32), 0, 0);
@@ -717,8 +717,8 @@ x86_sse_avx_mix_buffers_no_gain_aligned(float *dst, co
while (nframes >= 16)
{
#if defined(COMPILER_MSVC) || defined(COMPILER_MINGW)
- _mm_prefetch(((char *)dst + (16 * sizeof(float))), _mm_hint(0));
- _mm_prefetch(((char *)src + (16 * sizeof(float))), _mm_hint(0));
+ _mm_prefetch(((char *)dst + (16 * sizeof(float))), _MM_HINT_NTA);
+ _mm_prefetch(((char *)src + (16 * sizeof(float))), _MM_HINT_NTA);
#else
__builtin_prefetch(reinterpret_cast<void const *>(src + 16), 0, 0);
__builtin_prefetch(reinterpret_cast<void const *>(dst + 16), 0, 0);