61 {
62#if defined(__i386__) || defined(_M_IX86) || defined(__x86_64__) || defined(_M_X64)
63#if !defined(_MSC_VER) || (defined(_MSC_VER) && defined(__clang__) && !defined(__c2__))
64 static const auto __cpuidex = [](int *cpuInfo, int func1, int func2) {
65 __asm__ __volatile__("cpuid\n\t" : "=a"(cpuInfo[0]), "=b"(cpuInfo[1]), "=c"(cpuInfo[2]), "=d"(cpuInfo[3]) : "a"(func1), "c"(func2));
66 };
67
68 static const auto _mm_clwb = [](const void *addr) { __asm__ __volatile__(".byte 0x66, 0x0f, 0xae, 0x30\n\t" : : "a"(addr)); };
69 static const auto _mm_clflushopt = [](const void *addr) { __asm__ __volatile__("clflushopt (%0)\n\t" : : "r"(addr)); };
70 static const auto _mm_clflush = [](const void *addr) { __asm__ __volatile__("clflush (%0)\n\t" : : "r"(addr)); };
71 static const auto _mm_sfence = []() { __asm__ __volatile__("sfence\n\t"); };
72#endif
73 int nBuff[4];
74 __cpuidex(nBuff, 0x7, 0x0);
75 if(nBuff[1] & (1 << 24))
76 {
77 return [](
const void *addr,
size_t bytes,
memory_flush kind) -> memory_flush {
78 if(kind == memory_flush_retain)
79 {
80 while(bytes > 0)
81 {
82 _mm_clwb(addr);
83 addr = (void *) ((uintptr_t) addr + 64);
84 bytes -= 64;
85 }
86 _mm_sfence();
88 }
89 while(bytes > 0)
90 {
91 _mm_clflushopt(addr);
92 addr = (void *) ((uintptr_t) addr + 64);
93 bytes -= 64;
94 }
95 _mm_sfence();
97 };
98 }
99 if(nBuff[1] & (1 << 23))
100 {
101 return [](
const void *addr,
size_t bytes,
memory_flush ) -> memory_flush {
102 while(bytes > 0)
103 {
104 _mm_clflushopt(addr);
105 addr = (void *) ((uintptr_t) addr + 64);
106 bytes -= 64;
107 }
108 _mm_sfence();
110 };
111 }
112 else
113 {
114
115 return [](
const void *addr,
size_t bytes,
memory_flush ) -> memory_flush {
116 while(bytes > 0)
117 {
118 _mm_clflush(addr);
119 addr = (void *) ((uintptr_t) addr + 64);
120 bytes -= 64;
121 }
123 };
124 }
125#elif defined(__aarch64__) || defined(_M_ARM64)
126#if !defined(_MSC_VER) || (defined(_MSC_VER) && defined(__clang__) && !defined(__c2__))
127 static const auto _dmb_ish = []() { __asm__ __volatile__("dmb ish" : : : "memory"); };
128 static const auto _dc_cvac = [](const void *addr) { __asm__ __volatile__("dc cvac, %0" : : "r"(addr) : "memory"); };
129 static const auto _dc_civac = [](const void *addr) { __asm__ __volatile__("dc civac, %0" : : "r"(addr) : "memory"); };
130#else
131 static const auto _dmb_ish = []() { __dmb(_ARM64_BARRIER_ISH); };
132 static const auto _dc_cvac = [](const void *addr) {
133 (void) addr;
134 abort();
135 };
136 static const auto _dc_civac = [](const void *addr) {
137 (void) addr;
138 abort();
139 };
140#endif
141 return [](
const void *addr,
size_t bytes,
memory_flush kind) -> memory_flush {
142 if(kind == memory_flush_retain)
143 {
144 while(bytes > 0)
145 {
146 _dc_cvac(addr);
147 addr = (void *) ((uintptr_t) addr + 64);
148 bytes -= 64;
149 }
150 _dmb_ish();
152 }
153 while(bytes > 0)
154 {
155 _dc_civac(addr);
156 addr = (void *) ((uintptr_t) addr + 64);
157 bytes -= 64;
158 }
159 _dmb_ish();
161 };
162#elif defined(__arm__) || defined(_M_ARM)
163#if !defined(_MSC_VER) || (defined(_MSC_VER) && defined(__clang__) && !defined(__c2__))
164#undef _MoveToCoprocessor
165#define _MoveToCoprocessor(value, coproc, opcode1, crn, crm, opcode2) \
166 __asm__ __volatile__("MCR p" #coproc ", " #opcode1 ", %0, c" #crn ", c" #crm ", " #opcode2 : : "r"(value) : "memory");
167#endif
168 return [](
const void *addr,
size_t bytes,
memory_flush kind) -> memory_flush {
169 if(kind == memory_flush_retain)
170 {
171 while(bytes > 0)
172 {
173
174 _MoveToCoprocessor(addr, 15, 0, 7, 10, 1);
175 addr = (void *) ((uintptr_t) addr + 64);
176 bytes -= 64;
177 }
178
179 _MoveToCoprocessor(0, 15, 0, 7, 10, 5);
181 }
182 while(bytes > 0)
183 {
184
185 _MoveToCoprocessor(addr, 15, 0, 7, 14, 1);
186 addr = (void *) ((uintptr_t) addr + 64);
187 bytes -= 64;
188 }
189
190 _MoveToCoprocessor(0, 15, 0, 7, 10, 5);
192 };
193#else
194#error Unsupported platform
195#endif
196 }
constexpr memory_flush memory_flush_retain
Flush modified cache line to memory, but retain as unmodified in cache.
Definition mem_flush_loads_stores.hpp:53
constexpr memory_flush memory_flush_evict
Flush modified cache line to memory, and evict completely from all caches.
Definition mem_flush_loads_stores.hpp:55
memory_flush
The kinds of cache line flushing which can be performed.
Definition mem_flush_loads_stores.hpp:45