13cab2bb3Spatrick //===-- clear_cache.c - Implement __clear_cache ---------------------------===// 23cab2bb3Spatrick // 33cab2bb3Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 43cab2bb3Spatrick // See https://llvm.org/LICENSE.txt for license information. 53cab2bb3Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 63cab2bb3Spatrick // 73cab2bb3Spatrick //===----------------------------------------------------------------------===// 83cab2bb3Spatrick 93cab2bb3Spatrick #include "int_lib.h" 103cab2bb3Spatrick #include <assert.h> 113cab2bb3Spatrick #include <stddef.h> 123cab2bb3Spatrick 133cab2bb3Spatrick #if __APPLE__ 143cab2bb3Spatrick #include <libkern/OSCacheControl.h> 153cab2bb3Spatrick #endif 163cab2bb3Spatrick 173cab2bb3Spatrick #if defined(_WIN32) 183cab2bb3Spatrick // Forward declare Win32 APIs since the GCC mode driver does not handle the 193cab2bb3Spatrick // newer SDKs as well as needed. 203cab2bb3Spatrick uint32_t FlushInstructionCache(uintptr_t hProcess, void *lpBaseAddress, 213cab2bb3Spatrick uintptr_t dwSize); 223cab2bb3Spatrick uintptr_t GetCurrentProcess(void); 233cab2bb3Spatrick #endif 243cab2bb3Spatrick 253cab2bb3Spatrick #if defined(__FreeBSD__) && defined(__arm__) 263cab2bb3Spatrick // clang-format off 273cab2bb3Spatrick #include <sys/types.h> 283cab2bb3Spatrick #include <machine/sysarch.h> 293cab2bb3Spatrick // clang-format on 303cab2bb3Spatrick #endif 313cab2bb3Spatrick 323cab2bb3Spatrick #if defined(__NetBSD__) && defined(__arm__) 333cab2bb3Spatrick #include <machine/sysarch.h> 343cab2bb3Spatrick #endif 353cab2bb3Spatrick 36e655f019Spatrick #if defined(__OpenBSD__) && (defined(__arm__) || defined(__mips__)) 373cab2bb3Spatrick // clang-format off 383cab2bb3Spatrick #include <sys/types.h> 393cab2bb3Spatrick #include <machine/sysarch.h> 403cab2bb3Spatrick // clang-format on 413cab2bb3Spatrick #endif 423cab2bb3Spatrick 433cab2bb3Spatrick #if defined(__linux__) && defined(__mips__) 443cab2bb3Spatrick #include <sys/cachectl.h> 453cab2bb3Spatrick #include <sys/syscall.h> 463cab2bb3Spatrick #include <unistd.h> 473cab2bb3Spatrick #endif 483cab2bb3Spatrick 493cab2bb3Spatrick // The compiler generates calls to __clear_cache() when creating 503cab2bb3Spatrick // trampoline functions on the stack for use with nested functions. 513cab2bb3Spatrick // It is expected to invalidate the instruction cache for the 523cab2bb3Spatrick // specified range. 533cab2bb3Spatrick 543cab2bb3Spatrick void __clear_cache(void *start, void *end) { 553cab2bb3Spatrick #if __i386__ || __x86_64__ || defined(_M_IX86) || defined(_M_X64) 563cab2bb3Spatrick // Intel processors have a unified instruction and data cache 573cab2bb3Spatrick // so there is nothing to do 583cab2bb3Spatrick #elif defined(_WIN32) && (defined(__arm__) || defined(__aarch64__)) 593cab2bb3Spatrick FlushInstructionCache(GetCurrentProcess(), start, end - start); 603cab2bb3Spatrick #elif defined(__arm__) && !defined(__APPLE__) 61e655f019Spatrick #if defined(__FreeBSD__) || defined(__NetBSD__) || defined(__OpenBSD__) 623cab2bb3Spatrick struct arm_sync_icache_args arg; 633cab2bb3Spatrick 643cab2bb3Spatrick arg.addr = (uintptr_t)start; 653cab2bb3Spatrick arg.len = (uintptr_t)end - (uintptr_t)start; 663cab2bb3Spatrick 673cab2bb3Spatrick sysarch(ARM_SYNC_ICACHE, &arg); 683cab2bb3Spatrick #elif defined(__linux__) 693cab2bb3Spatrick // We used to include asm/unistd.h for the __ARM_NR_cacheflush define, but 703cab2bb3Spatrick // it also brought many other unused defines, as well as a dependency on 713cab2bb3Spatrick // kernel headers to be installed. 723cab2bb3Spatrick // 733cab2bb3Spatrick // This value is stable at least since Linux 3.13 and should remain so for 743cab2bb3Spatrick // compatibility reasons, warranting it's re-definition here. 753cab2bb3Spatrick #define __ARM_NR_cacheflush 0x0f0002 763cab2bb3Spatrick register int start_reg __asm("r0") = (int)(intptr_t)start; 773cab2bb3Spatrick const register int end_reg __asm("r1") = (int)(intptr_t)end; 783cab2bb3Spatrick const register int flags __asm("r2") = 0; 793cab2bb3Spatrick const register int syscall_nr __asm("r7") = __ARM_NR_cacheflush; 803cab2bb3Spatrick __asm __volatile("svc 0x0" 813cab2bb3Spatrick : "=r"(start_reg) 823cab2bb3Spatrick : "r"(syscall_nr), "r"(start_reg), "r"(end_reg), "r"(flags)); 833cab2bb3Spatrick assert(start_reg == 0 && "Cache flush syscall failed."); 843cab2bb3Spatrick #else 853cab2bb3Spatrick compilerrt_abort(); 863cab2bb3Spatrick #endif 873cab2bb3Spatrick #elif defined(__linux__) && defined(__mips__) 883cab2bb3Spatrick const uintptr_t start_int = (uintptr_t)start; 893cab2bb3Spatrick const uintptr_t end_int = (uintptr_t)end; 903cab2bb3Spatrick syscall(__NR_cacheflush, start, (end_int - start_int), BCACHE); 913cab2bb3Spatrick #elif defined(__mips__) && defined(__OpenBSD__) 923cab2bb3Spatrick cacheflush(start, (uintptr_t)end - (uintptr_t)start, BCACHE); 933cab2bb3Spatrick #elif defined(__aarch64__) && !defined(__APPLE__) 943cab2bb3Spatrick uint64_t xstart = (uint64_t)(uintptr_t)start; 953cab2bb3Spatrick uint64_t xend = (uint64_t)(uintptr_t)end; 963cab2bb3Spatrick 973cab2bb3Spatrick // Get Cache Type Info. 983cab2bb3Spatrick static uint64_t ctr_el0 = 0; 993cab2bb3Spatrick if (ctr_el0 == 0) 1003cab2bb3Spatrick __asm __volatile("mrs %0, ctr_el0" : "=r"(ctr_el0)); 1013cab2bb3Spatrick 1023cab2bb3Spatrick // The DC and IC instructions must use 64-bit registers so we don't use 1033cab2bb3Spatrick // uintptr_t in case this runs in an IPL32 environment. 1043cab2bb3Spatrick uint64_t addr; 1053cab2bb3Spatrick 1063cab2bb3Spatrick // If CTR_EL0.IDC is set, data cache cleaning to the point of unification 1073cab2bb3Spatrick // is not required for instruction to data coherence. 1083cab2bb3Spatrick if (((ctr_el0 >> 28) & 0x1) == 0x0) { 1093cab2bb3Spatrick const size_t dcache_line_size = 4 << ((ctr_el0 >> 16) & 15); 1103cab2bb3Spatrick for (addr = xstart & ~(dcache_line_size - 1); addr < xend; 1113cab2bb3Spatrick addr += dcache_line_size) 1123cab2bb3Spatrick __asm __volatile("dc cvau, %0" ::"r"(addr)); 1133cab2bb3Spatrick } 1143cab2bb3Spatrick __asm __volatile("dsb ish"); 1153cab2bb3Spatrick 1163cab2bb3Spatrick // If CTR_EL0.DIC is set, instruction cache invalidation to the point of 1173cab2bb3Spatrick // unification is not required for instruction to data coherence. 1183cab2bb3Spatrick if (((ctr_el0 >> 29) & 0x1) == 0x0) { 1193cab2bb3Spatrick const size_t icache_line_size = 4 << ((ctr_el0 >> 0) & 15); 1203cab2bb3Spatrick for (addr = xstart & ~(icache_line_size - 1); addr < xend; 1213cab2bb3Spatrick addr += icache_line_size) 1223cab2bb3Spatrick __asm __volatile("ic ivau, %0" ::"r"(addr)); 1233cab2bb3Spatrick } 1243cab2bb3Spatrick __asm __volatile("isb sy"); 1253cab2bb3Spatrick #elif defined(__powerpc64__) 1263cab2bb3Spatrick const size_t line_size = 32; 1273cab2bb3Spatrick const size_t len = (uintptr_t)end - (uintptr_t)start; 1283cab2bb3Spatrick 1293cab2bb3Spatrick const uintptr_t mask = ~(line_size - 1); 1303cab2bb3Spatrick const uintptr_t start_line = ((uintptr_t)start) & mask; 1313cab2bb3Spatrick const uintptr_t end_line = ((uintptr_t)start + len + line_size - 1) & mask; 1323cab2bb3Spatrick 1333cab2bb3Spatrick for (uintptr_t line = start_line; line < end_line; line += line_size) 1343cab2bb3Spatrick __asm__ volatile("dcbf 0, %0" : : "r"(line)); 1353cab2bb3Spatrick __asm__ volatile("sync"); 1363cab2bb3Spatrick 1373cab2bb3Spatrick for (uintptr_t line = start_line; line < end_line; line += line_size) 1383cab2bb3Spatrick __asm__ volatile("icbi 0, %0" : : "r"(line)); 1393cab2bb3Spatrick __asm__ volatile("isync"); 1403cab2bb3Spatrick #elif defined(__sparc__) 1413cab2bb3Spatrick const size_t dword_size = 8; 1423cab2bb3Spatrick const size_t len = (uintptr_t)end - (uintptr_t)start; 1433cab2bb3Spatrick 1443cab2bb3Spatrick const uintptr_t mask = ~(dword_size - 1); 1453cab2bb3Spatrick const uintptr_t start_dword = ((uintptr_t)start) & mask; 1463cab2bb3Spatrick const uintptr_t end_dword = ((uintptr_t)start + len + dword_size - 1) & mask; 1473cab2bb3Spatrick 1483cab2bb3Spatrick for (uintptr_t dword = start_dword; dword < end_dword; dword += dword_size) 1493cab2bb3Spatrick __asm__ volatile("flush %0" : : "r"(dword)); 150*cfed65dbSpatrick #elif defined(__riscv) && defined(__linux__) 151*cfed65dbSpatrick #define __NR_riscv_flush_icache (244 + 15) 152*cfed65dbSpatrick register void *start_reg __asm("a0") = start; 153*cfed65dbSpatrick const register void *end_reg __asm("a1") = end; 154*cfed65dbSpatrick const register long flags __asm("a2") = 0; 155*cfed65dbSpatrick const register long syscall_nr __asm("a7") = __NR_riscv_flush_icache; 156*cfed65dbSpatrick __asm __volatile("ecall" 157*cfed65dbSpatrick : "=r"(start_reg) 158*cfed65dbSpatrick : "r"(start_reg), "r"(end_reg), "r"(flags), "r"(syscall_nr)); 159*cfed65dbSpatrick assert(start_reg == 0 && "Cache flush syscall failed."); 1603cab2bb3Spatrick #else 1613cab2bb3Spatrick #if __APPLE__ 1623cab2bb3Spatrick // On Darwin, sys_icache_invalidate() provides this functionality 1633cab2bb3Spatrick sys_icache_invalidate(start, end - start); 1643cab2bb3Spatrick #else 1653cab2bb3Spatrick compilerrt_abort(); 1663cab2bb3Spatrick #endif 1673cab2bb3Spatrick #endif 1683cab2bb3Spatrick } 169