/* SPDX-License-Identifier: LGPL-2.1 OR MIT */
/*
 * rseq.h
 *
 * (C) Copyright 2016-2018 - Mathieu Desnoyers
 */

#ifndef RSEQ_H
#define RSEQ_H

#include <stdint.h>
#include <stdbool.h>
#include <pthread.h>
#include <signal.h>
#include <sched.h>
#include <errno.h>
#include <stdio.h>
#include <stdlib.h>
#include <stddef.h>
#include <assert.h>
#include "rseq-abi.h"
#include "compiler.h"

#ifndef rseq_sizeof_field
#define rseq_sizeof_field(TYPE, MEMBER) sizeof((((TYPE *)0)->MEMBER))
#endif

#ifndef rseq_offsetofend
#define rseq_offsetofend(TYPE, MEMBER) \
	(offsetof(TYPE, MEMBER) + rseq_sizeof_field(TYPE, MEMBER))
#endif

/*
 * Empty code injection macros, override when testing.
 * It is important to consider that the ASM injection macros need to be
 * fully reentrant (e.g. do not modify the stack).
 */
#ifndef RSEQ_INJECT_ASM
#define RSEQ_INJECT_ASM(n)
#endif

#ifndef RSEQ_INJECT_C
#define RSEQ_INJECT_C(n)
#endif

#ifndef RSEQ_INJECT_INPUT
#define RSEQ_INJECT_INPUT
#endif

#ifndef RSEQ_INJECT_CLOBBER
#define RSEQ_INJECT_CLOBBER
#endif

#ifndef RSEQ_INJECT_FAILED
#define RSEQ_INJECT_FAILED
#endif

#include "rseq-thread-pointer.h"

/* Offset from the thread pointer to the rseq area. */
extern ptrdiff_t rseq_offset;

/*
 * Size of the registered rseq area. 0 if the registration was
 * unsuccessful.
 */
extern unsigned int rseq_size;

/* Flags used during rseq registration. */
extern unsigned int rseq_flags;

/*
 * rseq feature size supported by the kernel. 0 if the registration was
 * unsuccessful.
 */
extern unsigned int rseq_feature_size;

enum rseq_mo {
	RSEQ_MO_RELAXED = 0,
	RSEQ_MO_CONSUME = 1,	/* Unused */
	RSEQ_MO_ACQUIRE = 2,	/* Unused */
	RSEQ_MO_RELEASE = 3,
	RSEQ_MO_ACQ_REL = 4,	/* Unused */
	RSEQ_MO_SEQ_CST = 5,	/* Unused */
};

enum rseq_percpu_mode {
	RSEQ_PERCPU_CPU_ID = 0,
	RSEQ_PERCPU_MM_CID = 1,
};

static inline struct rseq_abi *rseq_get_abi(void)
{
	return (struct rseq_abi *) ((uintptr_t) rseq_thread_pointer() + rseq_offset);
}

#define rseq_likely(x)		__builtin_expect(!!(x), 1)
#define rseq_unlikely(x)	__builtin_expect(!!(x), 0)
#define rseq_barrier()		__asm__ __volatile__("" : : : "memory")

#define RSEQ_ACCESS_ONCE(x)	(*(__volatile__ __typeof__(x) *)&(x))
#define RSEQ_WRITE_ONCE(x, v)	__extension__ ({ RSEQ_ACCESS_ONCE(x) = (v); })
#define RSEQ_READ_ONCE(x)	RSEQ_ACCESS_ONCE(x)

#define __rseq_str_1(x)	#x
#define __rseq_str(x)		__rseq_str_1(x)

#define rseq_log(fmt, args...)						       \
	fprintf(stderr, fmt "(in %s() at " __FILE__ ":" __rseq_str(__LINE__)"\n", \
		## args, __func__)

#define rseq_bug(fmt, args...)		\
	do {				\
		rseq_log(fmt, ##args);	\
		abort();		\
	} while (0)

#if defined(__x86_64__) || defined(__i386__)
#include <rseq-x86.h>
#elif defined(__ARMEL__)
#include <rseq-arm.h>
#elif defined (__AARCH64EL__)
#include <rseq-arm64.h>
#elif defined(__PPC__)
#include <rseq-ppc.h>
#elif defined(__mips__)
#include <rseq-mips.h>
#elif defined(__s390__)
#include <rseq-s390.h>
#elif defined(__riscv)
#include <rseq-riscv.h>
#else
#error unsupported target
#endif

/*
 * Register rseq for the current thread. This needs to be called once
 * by any thread which uses restartable sequences, before it starts
 * using them, to ensure that restartable sequences succeed. A
 * restartable sequence executed from a non-registered thread will
 * always fail.
 */
int rseq_register_current_thread(void);

/*
 * Unregister rseq for the current thread.
 */
int rseq_unregister_current_thread(void);

/*
 * Restartable sequence fallback for reading the current CPU number.
 */
int32_t rseq_fallback_current_cpu(void);

/*
 * Restartable sequence fallback for reading the current node number.
 */
int32_t rseq_fallback_current_node(void);
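/*
 * Example usage (a sketch, not part of this header): every thread,
 * including the main thread, registers itself before entering rseq
 * critical sections and may unregister before exiting. The start
 * routine name worker() is hypothetical.
 *
 *	static void *worker(void *arg)
 *	{
 *		if (rseq_register_current_thread())
 *			abort();
 *
 *		...use rseq critical sections and helpers here...
 *
 *		if (rseq_unregister_current_thread())
 *			abort();
 *		return NULL;
 *	}
 */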
/*
 * Values returned can be either the current CPU number, -1 (rseq is
 * uninitialized), or -2 (rseq initialization has failed).
 */
static inline int32_t rseq_current_cpu_raw(void)
{
	return RSEQ_ACCESS_ONCE(rseq_get_abi()->cpu_id);
}

/*
 * Returns a possible CPU number, which is typically the current CPU.
 * The returned CPU number can be used to prepare for an rseq critical
 * section, which will confirm whether the cpu number is indeed the
 * current one, and whether rseq is initialized.
 *
 * The CPU number returned by rseq_cpu_start should always be validated
 * by passing it to a rseq asm sequence, or by comparing it to the
 * return value of rseq_current_cpu_raw() if the rseq asm sequence
 * does not need to be invoked.
 */
static inline uint32_t rseq_cpu_start(void)
{
	return RSEQ_ACCESS_ONCE(rseq_get_abi()->cpu_id_start);
}

static inline uint32_t rseq_current_cpu(void)
{
	int32_t cpu;

	cpu = rseq_current_cpu_raw();
	if (rseq_unlikely(cpu < 0))
		cpu = rseq_fallback_current_cpu();
	return cpu;
}

static inline bool rseq_node_id_available(void)
{
	return (int) rseq_feature_size >= rseq_offsetofend(struct rseq_abi, node_id);
}

/*
 * Current NUMA node number.
 */
static inline uint32_t rseq_current_node_id(void)
{
	assert(rseq_node_id_available());
	return RSEQ_ACCESS_ONCE(rseq_get_abi()->node_id);
}

static inline bool rseq_mm_cid_available(void)
{
	return (int) rseq_feature_size >= rseq_offsetofend(struct rseq_abi, mm_cid);
}

static inline uint32_t rseq_current_mm_cid(void)
{
	return RSEQ_ACCESS_ONCE(rseq_get_abi()->mm_cid);
}

static inline void rseq_clear_rseq_cs(void)
{
	RSEQ_WRITE_ONCE(rseq_get_abi()->rseq_cs.arch.ptr, 0);
}

/*
 * rseq_prepare_unload() should be invoked by each thread executing a rseq
 * critical section at least once between their last critical section and
 * library unload of the library defining the rseq critical section (struct
 * rseq_cs) or the code referred to by the struct rseq_cs start_ip and
 * post_commit_offset fields. This also applies to use of rseq in code
 * generated by JIT: rseq_prepare_unload() should be invoked at least once by
 * each thread executing a rseq critical section before reclaim of the memory
 * holding the struct rseq_cs or reclaim of the code pointed to by struct
 * rseq_cs start_ip and post_commit_offset fields.
 */
static inline void rseq_prepare_unload(void)
{
	rseq_clear_rseq_cs();
}

static inline __attribute__((always_inline))
int rseq_cmpeqv_storev(enum rseq_mo rseq_mo, enum rseq_percpu_mode percpu_mode,
		       intptr_t *v, intptr_t expect,
		       intptr_t newv, int cpu)
{
	if (rseq_mo != RSEQ_MO_RELAXED)
		return -1;
	switch (percpu_mode) {
	case RSEQ_PERCPU_CPU_ID:
		return rseq_cmpeqv_storev_relaxed_cpu_id(v, expect, newv, cpu);
	case RSEQ_PERCPU_MM_CID:
		return rseq_cmpeqv_storev_relaxed_mm_cid(v, expect, newv, cpu);
	}
	return -1;
}
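/*
 * Example usage (a sketch, not part of this header): incrementing a
 * per-CPU counter with rseq_cmpeqv_storev(). The percpu_count[] array
 * and percpu_inc() helper are hypothetical. A nonzero return value
 * means the comparison failed or the sequence was aborted (e.g. by
 * preemption or CPU migration), so the operation is retried on the
 * then-current CPU. With RSEQ_PERCPU_MM_CID, rseq_current_mm_cid()
 * would be used as the index instead.
 *
 *	static intptr_t percpu_count[CPU_SETSIZE];
 *
 *	static void percpu_inc(void)
 *	{
 *		int ret;
 *
 *		do {
 *			int cpu = rseq_cpu_start();
 *			intptr_t expect = RSEQ_READ_ONCE(percpu_count[cpu]);
 *
 *			ret = rseq_cmpeqv_storev(RSEQ_MO_RELAXED,
 *						 RSEQ_PERCPU_CPU_ID,
 *						 &percpu_count[cpu], expect,
 *						 expect + 1, cpu);
 *		} while (ret);
 *	}
 */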
/*
 * Compare @v against @expectnot. When it does _not_ match, load @v
 * into @load, and store the content of *@v + voffp into @v.
 */
static inline __attribute__((always_inline))
int rseq_cmpnev_storeoffp_load(enum rseq_mo rseq_mo, enum rseq_percpu_mode percpu_mode,
			       intptr_t *v, intptr_t expectnot, long voffp, intptr_t *load,
			       int cpu)
{
	if (rseq_mo != RSEQ_MO_RELAXED)
		return -1;
	switch (percpu_mode) {
	case RSEQ_PERCPU_CPU_ID:
		return rseq_cmpnev_storeoffp_load_relaxed_cpu_id(v, expectnot, voffp, load, cpu);
	case RSEQ_PERCPU_MM_CID:
		return rseq_cmpnev_storeoffp_load_relaxed_mm_cid(v, expectnot, voffp, load, cpu);
	}
	return -1;
}

static inline __attribute__((always_inline))
int rseq_addv(enum rseq_mo rseq_mo, enum rseq_percpu_mode percpu_mode,
	      intptr_t *v, intptr_t count, int cpu)
{
	if (rseq_mo != RSEQ_MO_RELAXED)
		return -1;
	switch (percpu_mode) {
	case RSEQ_PERCPU_CPU_ID:
		return rseq_addv_relaxed_cpu_id(v, count, cpu);
	case RSEQ_PERCPU_MM_CID:
		return rseq_addv_relaxed_mm_cid(v, count, cpu);
	}
	return -1;
}

#ifdef RSEQ_ARCH_HAS_OFFSET_DEREF_ADDV
/*
 *   pval = *(ptr+off)
 *   *pval += inc;
 */
static inline __attribute__((always_inline))
int rseq_offset_deref_addv(enum rseq_mo rseq_mo, enum rseq_percpu_mode percpu_mode,
			   intptr_t *ptr, long off, intptr_t inc, int cpu)
{
	if (rseq_mo != RSEQ_MO_RELAXED)
		return -1;
	switch (percpu_mode) {
	case RSEQ_PERCPU_CPU_ID:
		return rseq_offset_deref_addv_relaxed_cpu_id(ptr, off, inc, cpu);
	case RSEQ_PERCPU_MM_CID:
		return rseq_offset_deref_addv_relaxed_mm_cid(ptr, off, inc, cpu);
	}
	return -1;
}
#endif

static inline __attribute__((always_inline))
int rseq_cmpeqv_trystorev_storev(enum rseq_mo rseq_mo, enum rseq_percpu_mode percpu_mode,
				 intptr_t *v, intptr_t expect,
				 intptr_t *v2, intptr_t newv2,
				 intptr_t newv, int cpu)
{
	switch (rseq_mo) {
	case RSEQ_MO_RELAXED:
		switch (percpu_mode) {
		case RSEQ_PERCPU_CPU_ID:
			return rseq_cmpeqv_trystorev_storev_relaxed_cpu_id(v, expect, v2, newv2, newv, cpu);
		case RSEQ_PERCPU_MM_CID:
			return rseq_cmpeqv_trystorev_storev_relaxed_mm_cid(v, expect, v2, newv2, newv, cpu);
		}
		return -1;
	case RSEQ_MO_RELEASE:
		switch (percpu_mode) {
		case RSEQ_PERCPU_CPU_ID:
			return rseq_cmpeqv_trystorev_storev_release_cpu_id(v, expect, v2, newv2, newv, cpu);
		case RSEQ_PERCPU_MM_CID:
			return rseq_cmpeqv_trystorev_storev_release_mm_cid(v, expect, v2, newv2, newv, cpu);
		}
		return -1;
	default:
		return -1;
	}
}

static inline __attribute__((always_inline))
int rseq_cmpeqv_cmpeqv_storev(enum rseq_mo rseq_mo, enum rseq_percpu_mode percpu_mode,
			      intptr_t *v, intptr_t expect,
			      intptr_t *v2, intptr_t expect2,
			      intptr_t newv, int cpu)
{
	if (rseq_mo != RSEQ_MO_RELAXED)
		return -1;
	switch (percpu_mode) {
	case RSEQ_PERCPU_CPU_ID:
		return rseq_cmpeqv_cmpeqv_storev_relaxed_cpu_id(v, expect, v2, expect2, newv, cpu);
	case RSEQ_PERCPU_MM_CID:
		return rseq_cmpeqv_cmpeqv_storev_relaxed_mm_cid(v, expect, v2, expect2, newv, cpu);
	}
	return -1;
}
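/*
 * Example usage (a sketch, not part of this header): pushing a node
 * onto a per-CPU stack with rseq_cmpeqv_trystorev_storev(). The node
 * type, percpu_head[] array and percpu_push() helper are hypothetical.
 * The sequence stores the old head into node->next (the v2/newv2 pair)
 * and then publishes the node as the new head (the v/newv pair),
 * retrying when the head changed or the sequence was aborted.
 * RSEQ_MO_RELEASE can be requested instead of RSEQ_MO_RELAXED if the
 * final store must order prior initialization of the node for
 * concurrent readers.
 *
 *	struct node {
 *		struct node *next;
 *	};
 *
 *	static struct node *percpu_head[CPU_SETSIZE];
 *
 *	static void percpu_push(struct node *node)
 *	{
 *		int ret;
 *
 *		do {
 *			int cpu = rseq_cpu_start();
 *			intptr_t head = (intptr_t) RSEQ_READ_ONCE(percpu_head[cpu]);
 *
 *			ret = rseq_cmpeqv_trystorev_storev(RSEQ_MO_RELAXED,
 *					RSEQ_PERCPU_CPU_ID,
 *					(intptr_t *) &percpu_head[cpu], head,
 *					(intptr_t *) &node->next, head,
 *					(intptr_t) node, cpu);
 *		} while (ret);
 *	}
 */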
static inline __attribute__((always_inline))
int rseq_cmpeqv_trymemcpy_storev(enum rseq_mo rseq_mo, enum rseq_percpu_mode percpu_mode,
				 intptr_t *v, intptr_t expect,
				 void *dst, void *src, size_t len,
				 intptr_t newv, int cpu)
{
	switch (rseq_mo) {
	case RSEQ_MO_RELAXED:
		switch (percpu_mode) {
		case RSEQ_PERCPU_CPU_ID:
			return rseq_cmpeqv_trymemcpy_storev_relaxed_cpu_id(v, expect, dst, src, len, newv, cpu);
		case RSEQ_PERCPU_MM_CID:
			return rseq_cmpeqv_trymemcpy_storev_relaxed_mm_cid(v, expect, dst, src, len, newv, cpu);
		}
		return -1;
	case RSEQ_MO_RELEASE:
		switch (percpu_mode) {
		case RSEQ_PERCPU_CPU_ID:
			return rseq_cmpeqv_trymemcpy_storev_release_cpu_id(v, expect, dst, src, len, newv, cpu);
		case RSEQ_PERCPU_MM_CID:
			return rseq_cmpeqv_trymemcpy_storev_release_mm_cid(v, expect, dst, src, len, newv, cpu);
		}
		return -1;
	default:
		return -1;
	}
}

#endif  /* RSEQ_H */