about summary refs log tree commit diff
path: root/sysdeps/x86_64/dl-trampoline.S
blob: 87c5137837f01a634d883a1c858b60796e1f6eae (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
/* PLT trampolines.  x86-64 version.
   Copyright (C) 2004-2024 Free Software Foundation, Inc.
   This file is part of the GNU C Library.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, see
   <https://www.gnu.org/licenses/>.  */

#include <config.h>
#include <sysdep.h>
#include <cpu-features-offsets.h>
#include <features-offsets.h>
#include <link-defines.h>
#include <isa-level.h>
#include "dl-trampoline-save.h"

/* Layout of the stack area in which the registers used for parameter
   passing are saved and restored when calling _dl_fixup.  Each
   register gets one 8-byte slot; every macro below is the byte offset
   of that register's slot from the start of the area.  */
#define REGISTER_SAVE_RAX	0
#define REGISTER_SAVE_RCX	(8 * 1)
#define REGISTER_SAVE_RDX	(8 * 2)
#define REGISTER_SAVE_RSI	(8 * 3)
#define REGISTER_SAVE_RDI	(8 * 4)
#define REGISTER_SAVE_R8	(8 * 5)
#define REGISTER_SAVE_R9	(8 * 6)

/* Valueless flag macro.  It stays defined for the instantiations of
   dl-trampoline.h that follow until the SSE variant of
   _dl_runtime_profile #undef's it.  */
#define RESTORE_AVX

/* _dl_runtime_profile variants, built only when SHARED is defined.
   dl-trampoline.h is included up to three times.  Before each include
   _dl_runtime_profile is renamed to a variant-specific symbol and
   VEC_SIZE, VMOVA and VEC(i) are set to a matching vector width in
   bytes, aligned vector move instruction and vector register name.
   Every macro defined for one instantiation is #undef'd right after
   its include, so the define/include/undef order must be kept.
   NOTE(review): how dl-trampoline.h consumes these macros is not
   visible from this file.  */
#ifdef SHARED
/* 64-byte ZMM variant, _dl_runtime_profile_avx512; always built under
   SHARED.  SECTION(p) appends ".evex512" to P.  */
# define VEC_SIZE		64
# define VMOVA			vmovdqa64
# define VEC(i)			zmm##i
# define _dl_runtime_profile	_dl_runtime_profile_avx512
#  define SECTION(p)		p##.evex512
# include "dl-trampoline.h"
# undef _dl_runtime_profile
# undef VEC
# undef VMOVA
# undef VEC_SIZE
# undef SECTION

/* 32-byte YMM variant, _dl_runtime_profile_avx; built only when the
   minimum ISA level is at or below the AVX level.  SECTION(p) appends
   ".avx" to P.  */
# if MINIMUM_X86_ISA_LEVEL <= AVX_X86_ISA_LEVEL
#  define VEC_SIZE		32
#  define VMOVA			vmovdqa
#  define VEC(i)			ymm##i
#  define SECTION(p)		p##.avx
#  define _dl_runtime_profile	_dl_runtime_profile_avx
#  include "dl-trampoline.h"
#  undef _dl_runtime_profile
#  undef VEC
#  undef VMOVA
#  undef VEC_SIZE
#  undef SECTION
# endif

/* 16-byte XMM variant, _dl_runtime_profile_sse; built only when the
   minimum ISA level is strictly below the AVX level.  Unlike the two
   variants above it defines no SECTION, and it #undef's RESTORE_AVX
   before the include; RESTORE_AVX is not defined again in the code
   that follows.  */
# if MINIMUM_X86_ISA_LEVEL < AVX_X86_ISA_LEVEL
/* movaps/movups is 1-byte shorter.  */
#  define VEC_SIZE		16
#  define VMOVA			movaps
#  define VEC(i)			xmm##i
#  define _dl_runtime_profile	_dl_runtime_profile_sse
#  undef RESTORE_AVX
#  include "dl-trampoline.h"
#  undef _dl_runtime_profile
#  undef VEC
#  undef VMOVA
#  undef VEC_SIZE
# endif
#endif /* SHARED */

/* FXSAVE variant of _dl_runtime_resolve.  Includes dl-trampoline.h
   with USE_FXSAVE defined, STATE_SAVE_ALIGNMENT set to 16 and
   _dl_runtime_resolve renamed to _dl_runtime_resolve_fxsave, then
   #undef's all three.  Built only when the minimum ISA level is
   strictly below the AVX level; it does not depend on SHARED.  */
#if MINIMUM_X86_ISA_LEVEL < AVX_X86_ISA_LEVEL
# define USE_FXSAVE
# define STATE_SAVE_ALIGNMENT	16
# define _dl_runtime_resolve	_dl_runtime_resolve_fxsave
# include "dl-trampoline.h"
# undef _dl_runtime_resolve
# undef USE_FXSAVE
# undef STATE_SAVE_ALIGNMENT
#endif

/* XSAVE variant of _dl_runtime_resolve, built unconditionally.
   Includes dl-trampoline.h with USE_XSAVE defined,
   STATE_SAVE_ALIGNMENT set to 64 and _dl_runtime_resolve renamed to
   _dl_runtime_resolve_xsave, then #undef's all three so they do not
   leak into a later include.  */
#define USE_XSAVE
#define STATE_SAVE_ALIGNMENT	64
#define _dl_runtime_resolve	_dl_runtime_resolve_xsave
#include "dl-trampoline.h"
#undef _dl_runtime_resolve
#undef USE_XSAVE
#undef STATE_SAVE_ALIGNMENT

/* XSAVEC variant of _dl_runtime_resolve, built unconditionally.
   Includes dl-trampoline.h with USE_XSAVEC defined,
   STATE_SAVE_ALIGNMENT set to 64 and _dl_runtime_resolve renamed to
   _dl_runtime_resolve_xsavec, then #undef's all three.  */
#define USE_XSAVEC
#define STATE_SAVE_ALIGNMENT	64
#define _dl_runtime_resolve	_dl_runtime_resolve_xsavec
#include "dl-trampoline.h"
#undef _dl_runtime_resolve
#undef USE_XSAVEC
#undef STATE_SAVE_ALIGNMENT