2016-05-12 17:51:24 +03:00
|
|
|
/*
|
|
|
|
* CDDL HEADER START
|
|
|
|
*
|
|
|
|
* The contents of this file are subject to the terms of the
|
|
|
|
* Common Development and Distribution License (the "License").
|
|
|
|
* You may not use this file except in compliance with the License.
|
|
|
|
*
|
|
|
|
* You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
|
|
|
|
* or http://www.opensolaris.org/os/licensing.
|
|
|
|
* See the License for the specific language governing permissions
|
|
|
|
* and limitations under the License.
|
|
|
|
*
|
|
|
|
* When distributing Covered Code, include this CDDL HEADER in each
|
|
|
|
* file and include the License file at usr/src/OPENSOLARIS.LICENSE.
|
|
|
|
* If applicable, add the following below this CDDL HEADER, with the
|
|
|
|
* fields enclosed by brackets "[]" replaced with your own identifying
|
|
|
|
* information: Portions Copyright [yyyy] [name of copyright owner]
|
|
|
|
*
|
|
|
|
* CDDL HEADER END
|
|
|
|
*/
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Copyright 2008 Sun Microsystems, Inc. All rights reserved.
|
|
|
|
* Use is subject to license terms.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef _IA32_SYS_ASM_LINKAGE_H
|
|
|
|
#define _IA32_SYS_ASM_LINKAGE_H
|
|
|
|
|
|
|
|
#include <sys/stack.h>
|
|
|
|
#include <sys/trap.h>
|
|
|
|
|
icp: properly fix all RETs in x86_64 Asm code
Commit 43569ee37420 ("Fix objtool: missing int3 after ret warning")
addressed replacing all `ret`s in x86 asm code to a macro in the
Linux kernel in order to enable SLS. That was done by copying the
upstream macro definitions and fixed objtool complaints.
Since then, several more mitigations were introduced, including
Rethunk. It requires a jump to one of the thunks in order
to work, so the RET macro was changed again. And, as ZFS code
didn't use the mainline definition, but copied it, this is currently
missing.
Objtool reminds us about it from time to time (Clang 16, CONFIG_RETHUNK=y):
fs/zfs/lua/zlua.o: warning: objtool: setjmp+0x25: 'naked' return
found in RETHUNK build
fs/zfs/lua/zlua.o: warning: objtool: longjmp+0x27: 'naked' return
found in RETHUNK build
Do it the following way:
* if we're building under Linux, unconditionally include
<linux/linkage.h> in the related files. It is available in x86
sources since even pre-2.6 times, so doesn't need any conftests;
* then, if RET macro is available, it will be used directly, so that
we will always have the version actual to the kernel we build;
* if there's no such macro, we define it as a simple `ret`, as it
was on pre-SLS times.
This ensures we always have the up-to-date definition with no need
to update it manually, and at the same time is safe for the whole
variety of kernels ZFS module supports.
Then, there's a couple more "naked" rets left in the code, they're
just defined as:
.byte 0xf3,0xc3
In fact, this is just:
rep ret
`rep ret` instead of just `ret` seems to mitigate performance issues
on some old AMD processors and most likely makes no sense as of
today.
Anyways, address those rets, so that they will be protected with
Rethunk and SLS. Include <sys/asm_linkage.h> here which now always
has RET definition and replace those constructs with just RET.
This wipes the last couple of places with unpatched rets objtool's
been complaining about.
Reviewed-by: Attila Fülöp <attila@fueloep.org>
Reviewed-by: Tino Reichardt <milky-zfs@mcmilk.de>
Reviewed-by: Richard Yao <richard.yao@alumni.stonybrook.edu>
Reviewed-by: Brian Behlendorf <behlendorf1@llnl.gov>
Signed-off-by: Alexander Lobakin <alobakin@pm.me>
Closes #14035
2022-10-16 17:53:22 +03:00
|
|
|
#if defined(_KERNEL) && defined(__linux__)
|
|
|
|
#include <linux/linkage.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
/*
 * Fallback definition of RET.
 *
 * If no earlier header (for example <linux/linkage.h>, which is included
 * above for Linux kernel builds) has already supplied a RET macro, define
 * it here as a plain `ret` instruction.
 */
#if !defined(RET)
#define	RET	ret
#endif	/* !RET */
|
|
|
|
|
2016-05-12 17:51:24 +03:00
|
|
|
#ifdef __cplusplus
|
|
|
|
extern "C" {
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifdef _ASM /* The remainder of this file is only for assembly files */
|
|
|
|
|
|
|
|
/*
|
|
|
|
* make annoying differences in assembler syntax go away
|
|
|
|
*/
|
|
|
|
|
|
|
|
/*
 * D16 and A16 insert instruction prefixes in front of the instruction that
 * follows them; _CONST, _BITNOT and _MUL wrap constant expressions.  Each
 * macro has one spelling per assembler so that the assembly sources using
 * them stay slightly more portable.
 */
#if defined(__GNUC_AS__)

/*
 * Why not use the 'data16' and 'addr16' prefixes .. well, the
 * assembler doesn't quite believe in real mode, and thus argues with
 * us about what we're trying to do.  Emit the prefix bytes directly.
 */
#define	D16	.byte 0x66;
#define	A16	.byte 0x67;

/* Constant expressions: parenthesised grouping, `~` for bitwise NOT. */
#define	_CONST(const)		(const)
#define	_BITNOT(const)		~_CONST(const)
#define	_MUL(a, b)		_CONST(a * b)

#else	/* !__GNUC_AS__ */

/*
 * /usr/ccs/bin/as prefixes are parsed as separate instructions
 */
#define	D16	data16;
#define	A16	addr16;

/*
 * (There are some weird constructs in constant expressions)
 * Grouping uses square brackets, bitwise NOT is spelled `-1!expr`, and
 * the multiplication operator is written `\*`.
 */
#define	_CONST(const)		[const]
#define	_BITNOT(const)		-1!_CONST(const)
#define	_MUL(a, b)		_CONST(a \* b)

#endif	/* __GNUC_AS__ */
|
|
|
|
|
|
|
|
/*
 * C pointers (and longs) are different sizes between i386 and amd64.
 * These constants can be used to compute offsets into pointer arrays:
 *
 *	CLONGSHIFT	log2 of the size of a C long, in bytes
 *	CLONGSIZE	size of a C long, in bytes
 *	CLONGMASK	CLONGSIZE - 1, for masking a byte offset within a long
 *
 * Any other architecture is rejected here with an explicit diagnostic.
 * Without it the constants would be left undefined and evaluate to 0 in
 * later #if expressions, which surfaces as a misleading "inconsistent
 * shift constants" error instead of naming the real problem.
 */
#if defined(__amd64)
#define	CLONGSHIFT	3
#define	CLONGSIZE	8
#define	CLONGMASK	7
#elif defined(__i386)
#define	CLONGSHIFT	2
#define	CLONGSIZE	4
#define	CLONGMASK	3
#else
#error "asm_linkage.h: unsupported architecture (expected __amd64 or __i386)"
#endif
|
|
|
|
|
|
|
|
/*
 * Since we know we're either ILP32 or LP64, a pointer has the same size as
 * a long, so the pointer constants are simply aliases of the long ones.
 */
#define	CPTRSHIFT	CLONGSHIFT
#define	CPTRSIZE	CLONGSIZE
#define	CPTRMASK	CLONGMASK

/* Build-time sanity check: each size must equal 1 << its shift. */
#if (1 << CPTRSHIFT) != CPTRSIZE || (1 << CLONGSHIFT) != CLONGSIZE
#error	"inconsistent shift constants"
#endif

/* Build-time sanity check: each mask must equal its size minus one. */
#if (CPTRSIZE - 1) != CPTRMASK || (CLONGSIZE - 1) != CLONGMASK
#error	"inconsistent mask constants"
#endif

/* Alignment, in bytes, passed to .align by the function-entry macros. */
#define	ASM_ENTRY_ALIGN	16
|
|
|
|
|
|
|
|
/*
 * SSE register alignment and save areas.
 *
 * SAVE_XMM_PROLOG(sreg, nreg) reserves stack space for `nreg` save slots of
 * XMM_SIZE bytes each and leaves the address of that area in `sreg`.
 * RSTOR_XMM_EPILOG(sreg, nreg) releases the same amount of stack again; it
 * takes `sreg` for symmetry but does not use it.  Both must be invoked with
 * the same `nreg`.
 */
#define	XMM_SIZE	16
#define	XMM_ALIGN	16

#if defined(__amd64)

/*
 * amd64: the stack pointer is lowered by nreg * XMM_SIZE and copied to
 * `sreg` as-is; no alignment adjustment is performed here.
 * NOTE(review): presumably relies on %rsp already being suitably aligned
 * at the point of use -- confirm against callers.
 */
#define	SAVE_XMM_PROLOG(sreg, nreg)				\
	subq	$_CONST(_MUL(XMM_SIZE, nreg)), %rsp;		\
	movq	%rsp, sreg

#define	RSTOR_XMM_EPILOG(sreg, nreg)				\
	addq	$_CONST(_MUL(XMM_SIZE, nreg)), %rsp

#elif defined(__i386)

/*
 * i386: XMM_ALIGN extra bytes are reserved, and `sreg` is set to
 * (%esp + XMM_ALIGN) rounded down to a multiple of XMM_ALIGN, so the save
 * area is XMM_ALIGN-aligned and lies inside the reserved region.
 */
#define	SAVE_XMM_PROLOG(sreg, nreg)				\
	subl	$_CONST(_MUL(XMM_SIZE, nreg) + XMM_ALIGN), %esp; \
	movl	%esp, sreg;					\
	addl	$XMM_ALIGN, sreg;				\
	andl	$_BITNOT(XMM_ALIGN-1), sreg

#define	RSTOR_XMM_EPILOG(sreg, nreg)				\
	addl	$_CONST(_MUL(XMM_SIZE, nreg) + XMM_ALIGN), %esp;

#endif	/* __i386 */
|
|
|
|
|
|
|
|
/*
 * Profiling hooks.
 *
 * MCOUNT(x) expands to the code that calls _mcount on entry to function
 * `x`; which flavour is used depends on the kind of profiling requested
 * (GPROF or PROF).  When neither is defined MCOUNT(x) expands to nothing.
 * RTMCOUNT(x) is always identical to MCOUNT(x).
 *
 * Both profiling sequences are written with 32-bit instructions
 * (pushl/popl, %ebp/%esp).
 */
#ifdef GPROF

/* gprof flavour: set up a frame, call _mcount, tear the frame down. */
#define	MCOUNT(x)			\
	pushl	%ebp;			\
	movl	%esp, %ebp;		\
	call	_mcount;		\
	popl	%ebp

#endif	/* GPROF */

#ifdef PROF

/*
 * prof flavour: additionally reserves a 4-byte, 4-aligned local word named
 * .L_<x>1 and passes its address to _mcount in %edx.
 *
 * The label is built by pasting `x` between ".L_" and "1".  An ISO C
 * preprocessor replaces each comment with a space, so the traditional
 * empty-comment pasting would yield ".L_ x 1"; use the ## operator there
 * and keep the empty-comment form only for traditional preprocessors.
 */
#if defined(__STDC__)

#define	MCOUNT(x)			\
	.lcomm	.L_##x##1, 4, 4;	\
	pushl	%ebp;			\
	movl	%esp, %ebp;		\
	movl	$.L_##x##1, %edx;	\
	call	_mcount;		\
	popl	%ebp

#else	/* !__STDC__ */

#define	MCOUNT(x)			\
/* CSTYLED */				\
	.lcomm	.L_/**/x/**/1, 4, 4;	\
	pushl	%ebp;			\
	movl	%esp, %ebp;		\
/* CSTYLED */				\
	movl	$.L_/**/x/**/1, %edx;	\
	call	_mcount;		\
	popl	%ebp

#endif	/* __STDC__ */

#endif	/* PROF */

/*
 * if we are not profiling, MCOUNT should be defined to nothing
 */
#if !defined(PROF) && !defined(GPROF)
#define	MCOUNT(x)
#endif	/* !defined(PROF) && !defined(GPROF) */

#define	RTMCOUNT(x)	MCOUNT(x)
|
|
|
|
|
|
|
|
/*
 * Macro to define weak symbol aliases. These are similar to the ANSI-C
 *	#pragma weak _name = name
 * except a compiler can determine type. The assembler must be told. Hence,
 * the second parameter must be the type of the symbol (i.e.: function,...)
 *
 * ANSI_PRAGMA_WEAK(sym, stype) declares the weak symbol _<sym>, gives it
 * ELF type @<stype>, and makes it an alias of <sym>.
 *
 * The alias name is formed by pasting "_" onto `sym`.  An ISO C
 * preprocessor replaces each comment with a space, so the traditional
 * empty-comment pasting would produce "_ sym"; use the ## operator there
 * and keep the empty-comment form only for traditional preprocessors.
 */
#if defined(__STDC__)

#define	ANSI_PRAGMA_WEAK(sym, stype)	\
	.weak	_##sym;			\
	.type	_##sym, @stype;		\
	_##sym = sym

#else	/* !__STDC__ */

#define	ANSI_PRAGMA_WEAK(sym, stype)	\
/* CSTYLED */				\
	.weak	_/**/sym;		\
/* CSTYLED */				\
	.type	_/**/sym, @stype;	\
/* CSTYLED */				\
	_/**/sym = sym

#endif	/* __STDC__ */
|
|
|
|
|
|
|
|
/*
 * Like ANSI_PRAGMA_WEAK(), but for unrelated names, as in:
 *	#pragma weak sym1 = sym2
 *
 * Declares `sym1` weak, gives it ELF type @<stype>, and makes it an alias
 * of `sym2`.
 */
#define	ANSI_PRAGMA_WEAK2(sym1, sym2, stype)	\
	.weak	sym1;				\
	.type	sym1, @stype;			\
	sym1 = sym2
|
|
|
|
|
|
|
|
/*
|
|
|
|
* ENTRY provides the standard procedure entry code and an easy way to
|
|
|
|
* insert the calls to mcount for profiling. ENTRY_NP is identical, but
|
|
|
|
* never calls mcount.
|
|
|
|
*/
|
icp: properly fix all RETs in x86_64 Asm code
Commit 43569ee37420 ("Fix objtool: missing int3 after ret warning")
addressed replacing all `ret`s in x86 asm code to a macro in the
Linux kernel in order to enable SLS. That was done by copying the
upstream macro definitions and fixed objtool complaints.
Since then, several more mitigations were introduced, including
Rethunk. It requires a jump to one of the thunks in order
to work, so the RET macro was changed again. And, as ZFS code
didn't use the mainline definition, but copied it, this is currently
missing.
Objtool reminds us about it from time to time (Clang 16, CONFIG_RETHUNK=y):
fs/zfs/lua/zlua.o: warning: objtool: setjmp+0x25: 'naked' return
found in RETHUNK build
fs/zfs/lua/zlua.o: warning: objtool: longjmp+0x27: 'naked' return
found in RETHUNK build
Do it the following way:
* if we're building under Linux, unconditionally include
<linux/linkage.h> in the related files. It is available in x86
sources since even pre-2.6 times, so doesn't need any conftests;
* then, if RET macro is available, it will be used directly, so that
we will always have the version actual to the kernel we build;
* if there's no such macro, we define it as a simple `ret`, as it
was on pre-SLS times.
This ensures we always have the up-to-date definition with no need
to update it manually, and at the same time is safe for the whole
variety of kernels ZFS module supports.
Then, there's a couple more "naked" rets left in the code, they're
just defined as:
.byte 0xf3,0xc3
In fact, this is just:
rep ret
`rep ret` instead of just `ret` seems to mitigate performance issues
on some old AMD processors and most likely makes no sense as of
today.
Anyways, address those rets, so that they will be protected with
Rethunk and SLS. Include <sys/asm_linkage.h> here which now always
has RET definition and replace those constructs with just RET.
This wipes the last couple of places with unpatched rets objtool's
been complaining about.
Reviewed-by: Attila Fülöp <attila@fueloep.org>
Reviewed-by: Tino Reichardt <milky-zfs@mcmilk.de>
Reviewed-by: Richard Yao <richard.yao@alumni.stonybrook.edu>
Reviewed-by: Brian Behlendorf <behlendorf1@llnl.gov>
Signed-off-by: Alexander Lobakin <alobakin@pm.me>
Closes #14035
2022-10-16 17:53:22 +03:00
|
|
|
/*
 * Drop any ENTRY macro defined by an earlier header so that the definition
 * below is the one in effect.
 */
#undef	ENTRY

/*
 * ENTRY(x): switch to .text, align to ASM_ENTRY_ALIGN, export `x` as a
 * global symbol of type @function, place the label, then expand MCOUNT(x).
 */
#define	ENTRY(x)			\
	.text;				\
	.align	ASM_ENTRY_ALIGN;	\
	.globl	x;			\
	.type	x, @function;		\
x:	MCOUNT(x)

/*
 * ENTRY_NP(x): same as ENTRY(x) but without the MCOUNT expansion, so the
 * profiling hook is never emitted.
 */
#define	ENTRY_NP(x)			\
	.text;				\
	.align	ASM_ENTRY_ALIGN;	\
	.globl	x;			\
	.type	x, @function;		\
x:

/*
 * RTENTRY(x): same as ENTRY(x) but expands RTMCOUNT(x) after the label.
 */
#define	RTENTRY(x)			\
	.text;				\
	.align	ASM_ENTRY_ALIGN;	\
	.globl	x;			\
	.type	x, @function;		\
x:	RTMCOUNT(x)
|
|
|
|
|
|
|
|
/*
 * ENTRY2 is identical to ENTRY but provides two labels for the entry point.
 * Both `x` and `y` are exported as global @function symbols at the same
 * address; MCOUNT is expanded with the first name, `x`.
 */
#define	ENTRY2(x, y)			\
	.text;				\
	.align	ASM_ENTRY_ALIGN;	\
	.globl	x, y;			\
	.type	x, @function;		\
	.type	y, @function;		\
/* CSTYLED */				\
x:	;				\
y:	MCOUNT(x)

/*
 * ENTRY_NP2 is the two-label form of ENTRY_NP: as ENTRY2, but without the
 * MCOUNT expansion.
 */
#define	ENTRY_NP2(x, y)			\
	.text;				\
	.align	ASM_ENTRY_ALIGN;	\
	.globl	x, y;			\
	.type	x, @function;		\
	.type	y, @function;		\
/* CSTYLED */				\
x:	;				\
y:
|
|
|
|
|
|
|
|
|
|
|
|
/*
 * ALTENTRY provides for additional entry points.
 *
 * It exports `x` as a global @function symbol and places its label at the
 * current location.  Unlike ENTRY it does not switch sections, does not
 * align, and does not expand MCOUNT.
 */
#define	ALTENTRY(x)			\
	.globl	x;			\
	.type	x, @function;		\
x:
|
|
|
|
|
|
|
|
/*
 * DGDEF, DGDEF2 and DGDEF3 provide global data declarations.
 *
 * Each one switches to .data, exports `name` as a global symbol of type
 * @object with the given ELF size, and places the label.  The macros
 * themselves emit no data directives after the label.
 *
 * DGDEF2(name, sz) declares "sz" bytes with **NO** alignment.  This
 * implies this macro is best used for byte arrays.
 *
 * DGDEF3(name, sz, algn) declares "sz" bytes with "algn" alignment.
 *
 * DGDEF(name) declares a word aligned word: DGDEF3 with a size and an
 * alignment of 4.
 */
#define	DGDEF2(name, sz)		\
	.data;				\
	.globl	name;			\
	.type	name, @object;		\
	.size	name, sz;		\
name:

#define	DGDEF3(name, sz, algn)		\
	.data;				\
	.align	algn;			\
	.globl	name;			\
	.type	name, @object;		\
	.size	name, sz;		\
name:

#define	DGDEF(name)	DGDEF3(name, 4, 4)
|
|
|
|
|
|
|
|
/*
 * SET_SIZE trails a function and sets the size for the ELF symbol table:
 * the size of `x` is recorded as the distance from the label `x` to the
 * current location.
 */
#define	SET_SIZE(x)	.size x, [.-x]
|
|
|
|
|
|
|
|
/*
 * NWORD provides native word value: it names the data directive suffix for
 * one native word, `quad` on amd64 and `long` on i386.
 */
#if defined(__amd64)
/*CSTYLED*/
#define	NWORD	quad
#elif defined(__i386)
#define	NWORD	long
#endif	/* __i386 */
|
|
|
|
|
|
|
|
#endif /* _ASM */
|
|
|
|
|
|
|
|
#ifdef __cplusplus
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#endif /* _IA32_SYS_ASM_LINKAGE_H */
|