| /* SPDX-License-Identifier: LGPL-2.1 OR MIT */ | 
 | /* | 
 |  * rseq-x86.h | 
 |  * | 
 |  * (C) Copyright 2016-2022 - Mathieu Desnoyers <mathieu.desnoyers@efficios.com> | 
 |  */ | 
 |  | 
 | #ifndef RSEQ_H | 
 | #error "Never use <rseq-x86.h> directly; include <rseq.h> instead." | 
 | #endif | 
 |  | 
 | #include <stdint.h> | 
 |  | 
 | /* | 
 |  * RSEQ_SIG is used with the following reserved undefined instructions, which | 
 |  * trap in user-space: | 
 |  * | 
 |  * x86-32:    0f b9 3d 53 30 05 53      ud1    0x53053053,%edi | 
 |  * x86-64:    0f b9 3d 53 30 05 53      ud1    0x53053053(%rip),%edi | 
 |  */ | 
 | #define RSEQ_SIG	0x53053053 | 
 |  | 
 | /* | 
 |  * Due to a compiler optimization bug in gcc-8 with asm goto and TLS asm input | 
 |  * operands, we cannot use "m" input operands, and rather pass the __rseq_abi | 
 |  * address through a "r" input operand. | 
 |  */ | 
 |  | 
 | /* Offset of cpu_id, rseq_cs, and mm_cid fields in struct rseq. */ | 
 | #define RSEQ_CPU_ID_OFFSET	4 | 
 | #define RSEQ_CS_OFFSET		8 | 
 | #define RSEQ_MM_CID_OFFSET	24 | 
 |  | 
 | #ifdef __x86_64__ | 
 |  | 
 | #define RSEQ_ASM_TP_SEGMENT	%%fs | 
 |  | 
 | #define rseq_smp_mb()	\ | 
 | 	__asm__ __volatile__ ("lock; addl $0,-128(%%rsp)" ::: "memory", "cc") | 
 | #define rseq_smp_rmb()	rseq_barrier() | 
 | #define rseq_smp_wmb()	rseq_barrier() | 
 |  | 
 | #define rseq_smp_load_acquire(p)					\ | 
 | __extension__ ({							\ | 
 | 	rseq_unqual_scalar_typeof(*(p)) ____p1 = RSEQ_READ_ONCE(*(p));	\ | 
 | 	rseq_barrier();							\ | 
 | 	____p1;								\ | 
 | }) | 
 |  | 
 | #define rseq_smp_acquire__after_ctrl_dep()	rseq_smp_rmb() | 
 |  | 
 | #define rseq_smp_store_release(p, v)					\ | 
 | do {									\ | 
 | 	rseq_barrier();							\ | 
 | 	RSEQ_WRITE_ONCE(*(p), v);					\ | 
 | } while (0) | 
 |  | 
 | #define __RSEQ_ASM_DEFINE_TABLE(label, version, flags,			\ | 
 | 				start_ip, post_commit_offset, abort_ip)	\ | 
 | 		".pushsection __rseq_cs, \"aw\"\n\t"			\ | 
 | 		".balign 32\n\t"					\ | 
 | 		__rseq_str(label) ":\n\t"				\ | 
 | 		".long " __rseq_str(version) ", " __rseq_str(flags) "\n\t" \ | 
 | 		".quad " __rseq_str(start_ip) ", " __rseq_str(post_commit_offset) ", " __rseq_str(abort_ip) "\n\t" \ | 
 | 		".popsection\n\t"					\ | 
 | 		".pushsection __rseq_cs_ptr_array, \"aw\"\n\t"		\ | 
 | 		".quad " __rseq_str(label) "b\n\t"			\ | 
 | 		".popsection\n\t" | 
 |  | 
 |  | 
 | #define RSEQ_ASM_DEFINE_TABLE(label, start_ip, post_commit_ip, abort_ip) \ | 
 | 	__RSEQ_ASM_DEFINE_TABLE(label, 0x0, 0x0, start_ip,		\ | 
 | 				(post_commit_ip - start_ip), abort_ip) | 
 |  | 
 | /* | 
 |  * Exit points of a rseq critical section consist of all instructions outside | 
 |  * of the critical section where a critical section can either branch to or | 
 |  * reach through the normal course of its execution. The abort IP and the | 
 |  * post-commit IP are already part of the __rseq_cs section and should not be | 
 |  * explicitly defined as additional exit points. Knowing all exit points is | 
 |  * useful to assist debuggers stepping over the critical section. | 
 |  */ | 
 | #define RSEQ_ASM_DEFINE_EXIT_POINT(start_ip, exit_ip)			\ | 
 | 		".pushsection __rseq_exit_point_array, \"aw\"\n\t"	\ | 
 | 		".quad " __rseq_str(start_ip) ", " __rseq_str(exit_ip) "\n\t" \ | 
 | 		".popsection\n\t" | 
 |  | 
 | #define RSEQ_ASM_STORE_RSEQ_CS(label, cs_label, rseq_cs)		\ | 
 | 		RSEQ_INJECT_ASM(1)					\ | 
 | 		"leaq " __rseq_str(cs_label) "(%%rip), %%rax\n\t"	\ | 
 | 		"movq %%rax, " __rseq_str(rseq_cs) "\n\t"		\ | 
 | 		__rseq_str(label) ":\n\t" | 
 |  | 
 | #define RSEQ_ASM_CMP_CPU_ID(cpu_id, current_cpu_id, label)		\ | 
 | 		RSEQ_INJECT_ASM(2)					\ | 
 | 		"cmpl %[" __rseq_str(cpu_id) "], " __rseq_str(current_cpu_id) "\n\t" \ | 
 | 		"jnz " __rseq_str(label) "\n\t" | 
 |  | 
 | #define RSEQ_ASM_DEFINE_ABORT(label, teardown, abort_label)		\ | 
 | 		".pushsection __rseq_failure, \"ax\"\n\t"		\ | 
 | 		/* Disassembler-friendly signature: ud1 <sig>(%rip),%edi. */ \ | 
 | 		".byte 0x0f, 0xb9, 0x3d\n\t"				\ | 
 | 		".long " __rseq_str(RSEQ_SIG) "\n\t"			\ | 
 | 		__rseq_str(label) ":\n\t"				\ | 
 | 		teardown						\ | 
 | 		"jmp %l[" __rseq_str(abort_label) "]\n\t"		\ | 
 | 		".popsection\n\t" | 
 |  | 
 | #define RSEQ_ASM_DEFINE_CMPFAIL(label, teardown, cmpfail_label)		\ | 
 | 		".pushsection __rseq_failure, \"ax\"\n\t"		\ | 
 | 		__rseq_str(label) ":\n\t"				\ | 
 | 		teardown						\ | 
 | 		"jmp %l[" __rseq_str(cmpfail_label) "]\n\t"		\ | 
 | 		".popsection\n\t" | 
 |  | 
 | #elif defined(__i386__) | 
 |  | 
 | #define RSEQ_ASM_TP_SEGMENT	%%gs | 
 |  | 
 | #define rseq_smp_mb()	\ | 
 | 	__asm__ __volatile__ ("lock; addl $0,-128(%%esp)" ::: "memory", "cc") | 
 | #define rseq_smp_rmb()	\ | 
 | 	__asm__ __volatile__ ("lock; addl $0,-128(%%esp)" ::: "memory", "cc") | 
 | #define rseq_smp_wmb()	\ | 
 | 	__asm__ __volatile__ ("lock; addl $0,-128(%%esp)" ::: "memory", "cc") | 
 |  | 
 | #define rseq_smp_load_acquire(p)					\ | 
 | __extension__ ({							\ | 
 | 	__typeof(*p) ____p1 = RSEQ_READ_ONCE(*p);			\ | 
 | 	rseq_smp_mb();							\ | 
 | 	____p1;								\ | 
 | }) | 
 |  | 
 | #define rseq_smp_acquire__after_ctrl_dep()	rseq_smp_rmb() | 
 |  | 
 | #define rseq_smp_store_release(p, v)					\ | 
 | do {									\ | 
 | 	rseq_smp_mb();							\ | 
 | 	RSEQ_WRITE_ONCE(*p, v);						\ | 
 | } while (0) | 
 |  | 
 | /* | 
 |  * Use eax as scratch register and take memory operands as input to | 
 |  * lessen register pressure. Especially needed when compiling in O0. | 
 |  */ | 
 | #define __RSEQ_ASM_DEFINE_TABLE(label, version, flags,			\ | 
 | 				start_ip, post_commit_offset, abort_ip)	\ | 
 | 		".pushsection __rseq_cs, \"aw\"\n\t"			\ | 
 | 		".balign 32\n\t"					\ | 
 | 		__rseq_str(label) ":\n\t"				\ | 
 | 		".long " __rseq_str(version) ", " __rseq_str(flags) "\n\t" \ | 
 | 		".long " __rseq_str(start_ip) ", 0x0, " __rseq_str(post_commit_offset) ", 0x0, " __rseq_str(abort_ip) ", 0x0\n\t" \ | 
 | 		".popsection\n\t"					\ | 
 | 		".pushsection __rseq_cs_ptr_array, \"aw\"\n\t"		\ | 
 | 		".long " __rseq_str(label) "b, 0x0\n\t"			\ | 
 | 		".popsection\n\t" | 
 |  | 
 | #define RSEQ_ASM_DEFINE_TABLE(label, start_ip, post_commit_ip, abort_ip) \ | 
 | 	__RSEQ_ASM_DEFINE_TABLE(label, 0x0, 0x0, start_ip,		\ | 
 | 				(post_commit_ip - start_ip), abort_ip) | 
 |  | 
 | /* | 
 |  * Exit points of a rseq critical section consist of all instructions outside | 
 |  * of the critical section where a critical section can either branch to or | 
 |  * reach through the normal course of its execution. The abort IP and the | 
 |  * post-commit IP are already part of the __rseq_cs section and should not be | 
 |  * explicitly defined as additional exit points. Knowing all exit points is | 
 |  * useful to assist debuggers stepping over the critical section. | 
 |  */ | 
 | #define RSEQ_ASM_DEFINE_EXIT_POINT(start_ip, exit_ip)			\ | 
 | 		".pushsection __rseq_exit_point_array, \"aw\"\n\t"	\ | 
 | 		".long " __rseq_str(start_ip) ", 0x0, " __rseq_str(exit_ip) ", 0x0\n\t" \ | 
 | 		".popsection\n\t" | 
 |  | 
 | #define RSEQ_ASM_STORE_RSEQ_CS(label, cs_label, rseq_cs)		\ | 
 | 		RSEQ_INJECT_ASM(1)					\ | 
 | 		"movl $" __rseq_str(cs_label) ", " __rseq_str(rseq_cs) "\n\t"	\ | 
 | 		__rseq_str(label) ":\n\t" | 
 |  | 
 | #define RSEQ_ASM_CMP_CPU_ID(cpu_id, current_cpu_id, label)		\ | 
 | 		RSEQ_INJECT_ASM(2)					\ | 
 | 		"cmpl %[" __rseq_str(cpu_id) "], " __rseq_str(current_cpu_id) "\n\t" \ | 
 | 		"jnz " __rseq_str(label) "\n\t" | 
 |  | 
 | #define RSEQ_ASM_DEFINE_ABORT(label, teardown, abort_label)		\ | 
 | 		".pushsection __rseq_failure, \"ax\"\n\t"		\ | 
 | 		/* Disassembler-friendly signature: ud1 <sig>,%edi. */	\ | 
 | 		".byte 0x0f, 0xb9, 0x3d\n\t"				\ | 
 | 		".long " __rseq_str(RSEQ_SIG) "\n\t"			\ | 
 | 		__rseq_str(label) ":\n\t"				\ | 
 | 		teardown						\ | 
 | 		"jmp %l[" __rseq_str(abort_label) "]\n\t"		\ | 
 | 		".popsection\n\t" | 
 |  | 
 | #define RSEQ_ASM_DEFINE_CMPFAIL(label, teardown, cmpfail_label)		\ | 
 | 		".pushsection __rseq_failure, \"ax\"\n\t"		\ | 
 | 		__rseq_str(label) ":\n\t"				\ | 
 | 		teardown						\ | 
 | 		"jmp %l[" __rseq_str(cmpfail_label) "]\n\t"		\ | 
 | 		".popsection\n\t" | 
 |  | 
 | #endif | 
 |  | 
 | /* Per-cpu-id indexing. */ | 
 |  | 
 | #define RSEQ_TEMPLATE_CPU_ID | 
 | #define RSEQ_TEMPLATE_MO_RELAXED | 
 | #include "rseq-x86-bits.h" | 
 | #undef RSEQ_TEMPLATE_MO_RELAXED | 
 |  | 
 | #define RSEQ_TEMPLATE_MO_RELEASE | 
 | #include "rseq-x86-bits.h" | 
 | #undef RSEQ_TEMPLATE_MO_RELEASE | 
 | #undef RSEQ_TEMPLATE_CPU_ID | 
 |  | 
 | /* Per-mm-cid indexing. */ | 
 |  | 
 | #define RSEQ_TEMPLATE_MM_CID | 
 | #define RSEQ_TEMPLATE_MO_RELAXED | 
 | #include "rseq-x86-bits.h" | 
 | #undef RSEQ_TEMPLATE_MO_RELAXED | 
 |  | 
 | #define RSEQ_TEMPLATE_MO_RELEASE | 
 | #include "rseq-x86-bits.h" | 
 | #undef RSEQ_TEMPLATE_MO_RELEASE | 
 | #undef RSEQ_TEMPLATE_MM_CID | 
 |  | 
 | /* APIs which are not based on cpu ids. */ | 
 |  | 
 | #define RSEQ_TEMPLATE_CPU_ID_NONE | 
 | #define RSEQ_TEMPLATE_MO_RELAXED | 
 | #include "rseq-x86-bits.h" | 
 | #undef RSEQ_TEMPLATE_MO_RELAXED | 
 | #undef RSEQ_TEMPLATE_CPU_ID_NONE |