13cab2bb3Spatrick //===-- linux.cpp -----------------------------------------------*- C++ -*-===//
23cab2bb3Spatrick //
33cab2bb3Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
43cab2bb3Spatrick // See https://llvm.org/LICENSE.txt for license information.
53cab2bb3Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
63cab2bb3Spatrick //
73cab2bb3Spatrick //===----------------------------------------------------------------------===//
83cab2bb3Spatrick
93cab2bb3Spatrick #include "platform.h"
103cab2bb3Spatrick
113cab2bb3Spatrick #if SCUDO_LINUX
123cab2bb3Spatrick
133cab2bb3Spatrick #include "common.h"
143cab2bb3Spatrick #include "linux.h"
153cab2bb3Spatrick #include "mutex.h"
163cab2bb3Spatrick #include "string_utils.h"
173cab2bb3Spatrick
183cab2bb3Spatrick #include <errno.h>
193cab2bb3Spatrick #include <fcntl.h>
203cab2bb3Spatrick #include <linux/futex.h>
213cab2bb3Spatrick #include <sched.h>
22*810390e3Srobert #include <stdio.h>
233cab2bb3Spatrick #include <stdlib.h>
243cab2bb3Spatrick #include <string.h>
253cab2bb3Spatrick #include <sys/mman.h>
263cab2bb3Spatrick #include <sys/stat.h>
273cab2bb3Spatrick #include <sys/syscall.h>
283cab2bb3Spatrick #include <sys/time.h>
293cab2bb3Spatrick #include <time.h>
303cab2bb3Spatrick #include <unistd.h>
313cab2bb3Spatrick
323cab2bb3Spatrick #if SCUDO_ANDROID
333cab2bb3Spatrick #include <sys/prctl.h>
343cab2bb3Spatrick // Definitions of prctl arguments to set a vma name in Android kernels.
353cab2bb3Spatrick #define ANDROID_PR_SET_VMA 0x53564d41
363cab2bb3Spatrick #define ANDROID_PR_SET_VMA_ANON_NAME 0
373cab2bb3Spatrick #endif
383cab2bb3Spatrick
393cab2bb3Spatrick namespace scudo {
403cab2bb3Spatrick
getPageSize()413cab2bb3Spatrick uptr getPageSize() { return static_cast<uptr>(sysconf(_SC_PAGESIZE)); }
423cab2bb3Spatrick
die()433cab2bb3Spatrick void NORETURN die() { abort(); }
443cab2bb3Spatrick
map(void * Addr,uptr Size,UNUSED const char * Name,uptr Flags,UNUSED MapPlatformData * Data)453cab2bb3Spatrick void *map(void *Addr, uptr Size, UNUSED const char *Name, uptr Flags,
463cab2bb3Spatrick UNUSED MapPlatformData *Data) {
473cab2bb3Spatrick int MmapFlags = MAP_PRIVATE | MAP_ANONYMOUS;
483cab2bb3Spatrick int MmapProt;
493cab2bb3Spatrick if (Flags & MAP_NOACCESS) {
503cab2bb3Spatrick MmapFlags |= MAP_NORESERVE;
513cab2bb3Spatrick MmapProt = PROT_NONE;
523cab2bb3Spatrick } else {
533cab2bb3Spatrick MmapProt = PROT_READ | PROT_WRITE;
54d89ec533Spatrick }
55d89ec533Spatrick #if defined(__aarch64__)
56d89ec533Spatrick #ifndef PROT_MTE
57d89ec533Spatrick #define PROT_MTE 0x20
58d89ec533Spatrick #endif
591f9cb04fSpatrick if (Flags & MAP_MEMTAG)
601f9cb04fSpatrick MmapProt |= PROT_MTE;
611f9cb04fSpatrick #endif
62d89ec533Spatrick if (Addr)
633cab2bb3Spatrick MmapFlags |= MAP_FIXED;
643cab2bb3Spatrick void *P = mmap(Addr, Size, MmapProt, MmapFlags, -1, 0);
653cab2bb3Spatrick if (P == MAP_FAILED) {
663cab2bb3Spatrick if (!(Flags & MAP_ALLOWNOMEM) || errno != ENOMEM)
67d89ec533Spatrick dieOnMapUnmapError(errno == ENOMEM ? Size : 0);
683cab2bb3Spatrick return nullptr;
693cab2bb3Spatrick }
703cab2bb3Spatrick #if SCUDO_ANDROID
71d89ec533Spatrick if (Name)
723cab2bb3Spatrick prctl(ANDROID_PR_SET_VMA, ANDROID_PR_SET_VMA_ANON_NAME, P, Size, Name);
733cab2bb3Spatrick #endif
743cab2bb3Spatrick return P;
753cab2bb3Spatrick }
763cab2bb3Spatrick
unmap(void * Addr,uptr Size,UNUSED uptr Flags,UNUSED MapPlatformData * Data)773cab2bb3Spatrick void unmap(void *Addr, uptr Size, UNUSED uptr Flags,
783cab2bb3Spatrick UNUSED MapPlatformData *Data) {
793cab2bb3Spatrick if (munmap(Addr, Size) != 0)
803cab2bb3Spatrick dieOnMapUnmapError();
813cab2bb3Spatrick }
823cab2bb3Spatrick
setMemoryPermission(uptr Addr,uptr Size,uptr Flags,UNUSED MapPlatformData * Data)83d89ec533Spatrick void setMemoryPermission(uptr Addr, uptr Size, uptr Flags,
84d89ec533Spatrick UNUSED MapPlatformData *Data) {
85d89ec533Spatrick int Prot = (Flags & MAP_NOACCESS) ? PROT_NONE : (PROT_READ | PROT_WRITE);
86d89ec533Spatrick if (mprotect(reinterpret_cast<void *>(Addr), Size, Prot) != 0)
87d89ec533Spatrick dieOnMapUnmapError();
88d89ec533Spatrick }
89d89ec533Spatrick
releasePagesToOS(uptr BaseAddress,uptr Offset,uptr Size,UNUSED MapPlatformData * Data)903cab2bb3Spatrick void releasePagesToOS(uptr BaseAddress, uptr Offset, uptr Size,
913cab2bb3Spatrick UNUSED MapPlatformData *Data) {
923cab2bb3Spatrick void *Addr = reinterpret_cast<void *>(BaseAddress + Offset);
93d89ec533Spatrick
943cab2bb3Spatrick while (madvise(Addr, Size, MADV_DONTNEED) == -1 && errno == EAGAIN) {
953cab2bb3Spatrick }
963cab2bb3Spatrick }
973cab2bb3Spatrick
// Forwards to getenv() and returns its result unchanged (a null pointer when
// Name is not set). Calling getenv is expected to be fine at any time.
const char *getEnv(const char *Name) {
  const char *const Value = getenv(Name);
  return Value;
}
1003cab2bb3Spatrick
1013cab2bb3Spatrick namespace {
1023cab2bb3Spatrick enum State : u32 { Unlocked = 0, Locked = 1, Sleeping = 2 };
1033cab2bb3Spatrick }
1043cab2bb3Spatrick
tryLock()1053cab2bb3Spatrick bool HybridMutex::tryLock() {
1063cab2bb3Spatrick return atomic_compare_exchange(&M, Unlocked, Locked) == Unlocked;
1073cab2bb3Spatrick }
1083cab2bb3Spatrick
1093cab2bb3Spatrick // The following is based on https://akkadia.org/drepper/futex.pdf.
lockSlow()1103cab2bb3Spatrick void HybridMutex::lockSlow() {
1113cab2bb3Spatrick u32 V = atomic_compare_exchange(&M, Unlocked, Locked);
1123cab2bb3Spatrick if (V == Unlocked)
1133cab2bb3Spatrick return;
1143cab2bb3Spatrick if (V != Sleeping)
1153cab2bb3Spatrick V = atomic_exchange(&M, Sleeping, memory_order_acquire);
1163cab2bb3Spatrick while (V != Unlocked) {
1173cab2bb3Spatrick syscall(SYS_futex, reinterpret_cast<uptr>(&M), FUTEX_WAIT_PRIVATE, Sleeping,
1183cab2bb3Spatrick nullptr, nullptr, 0);
1193cab2bb3Spatrick V = atomic_exchange(&M, Sleeping, memory_order_acquire);
1203cab2bb3Spatrick }
1213cab2bb3Spatrick }
1223cab2bb3Spatrick
unlock()1233cab2bb3Spatrick void HybridMutex::unlock() {
1243cab2bb3Spatrick if (atomic_fetch_sub(&M, 1U, memory_order_release) != Locked) {
1253cab2bb3Spatrick atomic_store(&M, Unlocked, memory_order_release);
1263cab2bb3Spatrick syscall(SYS_futex, reinterpret_cast<uptr>(&M), FUTEX_WAKE_PRIVATE, 1,
1273cab2bb3Spatrick nullptr, nullptr, 0);
1283cab2bb3Spatrick }
1293cab2bb3Spatrick }
1303cab2bb3Spatrick
getMonotonicTime()1313cab2bb3Spatrick u64 getMonotonicTime() {
1323cab2bb3Spatrick timespec TS;
1333cab2bb3Spatrick clock_gettime(CLOCK_MONOTONIC, &TS);
1343cab2bb3Spatrick return static_cast<u64>(TS.tv_sec) * (1000ULL * 1000 * 1000) +
1353cab2bb3Spatrick static_cast<u64>(TS.tv_nsec);
1363cab2bb3Spatrick }
1373cab2bb3Spatrick
getNumberOfCPUs()1383cab2bb3Spatrick u32 getNumberOfCPUs() {
1393cab2bb3Spatrick cpu_set_t CPUs;
1401f9cb04fSpatrick // sched_getaffinity can fail for a variety of legitimate reasons (lack of
1411f9cb04fSpatrick // CAP_SYS_NICE, syscall filtering, etc), in which case we shall return 0.
1421f9cb04fSpatrick if (sched_getaffinity(0, sizeof(cpu_set_t), &CPUs) != 0)
1431f9cb04fSpatrick return 0;
1443cab2bb3Spatrick return static_cast<u32>(CPU_COUNT(&CPUs));
1453cab2bb3Spatrick }
1463cab2bb3Spatrick
getThreadID()1471f9cb04fSpatrick u32 getThreadID() {
1481f9cb04fSpatrick #if SCUDO_ANDROID
1491f9cb04fSpatrick return static_cast<u32>(gettid());
1501f9cb04fSpatrick #else
1511f9cb04fSpatrick return static_cast<u32>(syscall(SYS_gettid));
1521f9cb04fSpatrick #endif
1531f9cb04fSpatrick }
1541f9cb04fSpatrick
1553cab2bb3Spatrick // Blocking is possibly unused if the getrandom block is not compiled in.
getRandom(void * Buffer,uptr Length,UNUSED bool Blocking)1563cab2bb3Spatrick bool getRandom(void *Buffer, uptr Length, UNUSED bool Blocking) {
1573cab2bb3Spatrick if (!Buffer || !Length || Length > MaxRandomLength)
1583cab2bb3Spatrick return false;
1593cab2bb3Spatrick ssize_t ReadBytes;
1603cab2bb3Spatrick #if defined(SYS_getrandom)
1613cab2bb3Spatrick #if !defined(GRND_NONBLOCK)
1623cab2bb3Spatrick #define GRND_NONBLOCK 1
1633cab2bb3Spatrick #endif
1643cab2bb3Spatrick // Up to 256 bytes, getrandom will not be interrupted.
1653cab2bb3Spatrick ReadBytes =
1663cab2bb3Spatrick syscall(SYS_getrandom, Buffer, Length, Blocking ? 0 : GRND_NONBLOCK);
1673cab2bb3Spatrick if (ReadBytes == static_cast<ssize_t>(Length))
1683cab2bb3Spatrick return true;
1693cab2bb3Spatrick #endif // defined(SYS_getrandom)
1703cab2bb3Spatrick // Up to 256 bytes, a read off /dev/urandom will not be interrupted.
1713cab2bb3Spatrick // Blocking is moot here, O_NONBLOCK has no effect when opening /dev/urandom.
1723cab2bb3Spatrick const int FileDesc = open("/dev/urandom", O_RDONLY);
1733cab2bb3Spatrick if (FileDesc == -1)
1743cab2bb3Spatrick return false;
1753cab2bb3Spatrick ReadBytes = read(FileDesc, Buffer, Length);
1763cab2bb3Spatrick close(FileDesc);
1773cab2bb3Spatrick return (ReadBytes == static_cast<ssize_t>(Length));
1783cab2bb3Spatrick }
1793cab2bb3Spatrick
1801f9cb04fSpatrick // Allocation free syslog-like API.
1811f9cb04fSpatrick extern "C" WEAK int async_safe_write_log(int pri, const char *tag,
1821f9cb04fSpatrick const char *msg);
1831f9cb04fSpatrick
GetRSSFromBuffer(const char * Buf)184*810390e3Srobert static uptr GetRSSFromBuffer(const char *Buf) {
185*810390e3Srobert // The format of the file is:
186*810390e3Srobert // 1084 89 69 11 0 79 0
187*810390e3Srobert // We need the second number which is RSS in pages.
188*810390e3Srobert const char *Pos = Buf;
189*810390e3Srobert // Skip the first number.
190*810390e3Srobert while (*Pos >= '0' && *Pos <= '9')
191*810390e3Srobert Pos++;
192*810390e3Srobert // Skip whitespaces.
193*810390e3Srobert while (!(*Pos >= '0' && *Pos <= '9') && *Pos != 0)
194*810390e3Srobert Pos++;
195*810390e3Srobert // Read the number.
196*810390e3Srobert u64 Rss = 0;
197*810390e3Srobert for (; *Pos >= '0' && *Pos <= '9'; Pos++)
198*810390e3Srobert Rss = Rss * 10 + static_cast<u64>(*Pos) - '0';
199*810390e3Srobert return static_cast<uptr>(Rss * getPageSizeCached());
200*810390e3Srobert }
201*810390e3Srobert
GetRSS()202*810390e3Srobert uptr GetRSS() {
203*810390e3Srobert // TODO: We currently use sanitizer_common's GetRSS which reads the
204*810390e3Srobert // RSS from /proc/self/statm by default. We might want to
205*810390e3Srobert // call getrusage directly, even if it's less accurate.
206*810390e3Srobert auto Fd = open("/proc/self/statm", O_RDONLY);
207*810390e3Srobert char Buf[64];
208*810390e3Srobert s64 Len = read(Fd, Buf, sizeof(Buf) - 1);
209*810390e3Srobert close(Fd);
210*810390e3Srobert if (Len <= 0)
211*810390e3Srobert return 0;
212*810390e3Srobert Buf[Len] = 0;
213*810390e3Srobert
214*810390e3Srobert return GetRSSFromBuffer(Buf);
215*810390e3Srobert }
216*810390e3Srobert
outputRaw(const char * Buffer)2173cab2bb3Spatrick void outputRaw(const char *Buffer) {
2181f9cb04fSpatrick if (&async_safe_write_log) {
2191f9cb04fSpatrick constexpr s32 AndroidLogInfo = 4;
2201f9cb04fSpatrick constexpr uptr MaxLength = 1024U;
2211f9cb04fSpatrick char LocalBuffer[MaxLength];
2221f9cb04fSpatrick while (strlen(Buffer) > MaxLength) {
2231f9cb04fSpatrick uptr P;
2241f9cb04fSpatrick for (P = MaxLength - 1; P > 0; P--) {
2251f9cb04fSpatrick if (Buffer[P] == '\n') {
2261f9cb04fSpatrick memcpy(LocalBuffer, Buffer, P);
2271f9cb04fSpatrick LocalBuffer[P] = '\0';
2281f9cb04fSpatrick async_safe_write_log(AndroidLogInfo, "scudo", LocalBuffer);
2291f9cb04fSpatrick Buffer = &Buffer[P + 1];
2301f9cb04fSpatrick break;
2311f9cb04fSpatrick }
2321f9cb04fSpatrick }
2331f9cb04fSpatrick // If no newline was found, just log the buffer.
2341f9cb04fSpatrick if (P == 0)
2351f9cb04fSpatrick break;
2361f9cb04fSpatrick }
2371f9cb04fSpatrick async_safe_write_log(AndroidLogInfo, "scudo", Buffer);
2381f9cb04fSpatrick } else {
239d89ec533Spatrick (void)write(2, Buffer, strlen(Buffer));
2403cab2bb3Spatrick }
2411f9cb04fSpatrick }
2423cab2bb3Spatrick
2433cab2bb3Spatrick extern "C" WEAK void android_set_abort_message(const char *);
2443cab2bb3Spatrick
setAbortMessage(const char * Message)2453cab2bb3Spatrick void setAbortMessage(const char *Message) {
2463cab2bb3Spatrick if (&android_set_abort_message)
2473cab2bb3Spatrick android_set_abort_message(Message);
2483cab2bb3Spatrick }
2493cab2bb3Spatrick
2503cab2bb3Spatrick } // namespace scudo
2513cab2bb3Spatrick
2523cab2bb3Spatrick #endif // SCUDO_LINUX
253