2017-12-18 15:30:13 +00:00
|
|
|
# SPDX-License-Identifier: GPL-2.0 WITH Linux-syscall-note
|
|
|
|
#
|
|
|
|
# System call table for s390
|
|
|
|
#
|
|
|
|
# Format:
|
|
|
|
#
|
|
|
|
# <nr> <abi> <syscall> <entry-64bit> <compat-entry>
|
|
|
|
#
|
|
|
|
# where <abi> can be common, 64, or 32
|
|
|
|
|
|
|
|
1 common exit sys_exit sys_exit
|
|
|
|
2 common fork sys_fork sys_fork
|
|
|
|
3 common read sys_read compat_sys_s390_read
|
|
|
|
4 common write sys_write compat_sys_s390_write
|
|
|
|
5 common open sys_open compat_sys_open
|
|
|
|
6 common close sys_close sys_close
|
|
|
|
7 common restart_syscall sys_restart_syscall sys_restart_syscall
|
2019-01-16 13:15:23 +00:00
|
|
|
8 common creat sys_creat sys_creat
|
|
|
|
9 common link sys_link sys_link
|
|
|
|
10 common unlink sys_unlink sys_unlink
|
2017-12-18 15:30:13 +00:00
|
|
|
11 common execve sys_execve compat_sys_execve
|
2019-01-16 13:15:23 +00:00
|
|
|
12 common chdir sys_chdir sys_chdir
|
2019-01-06 23:33:08 +00:00
|
|
|
13 32 time - sys_time32
|
2019-01-16 13:15:23 +00:00
|
|
|
14 common mknod sys_mknod sys_mknod
|
|
|
|
15 common chmod sys_chmod sys_chmod
|
|
|
|
16 32 lchown - sys_lchown16
|
2017-12-18 15:30:13 +00:00
|
|
|
19 common lseek sys_lseek compat_sys_lseek
|
|
|
|
20 common getpid sys_getpid sys_getpid
|
2020-09-17 08:22:34 +00:00
|
|
|
21 common mount sys_mount sys_mount
|
2019-01-16 13:15:23 +00:00
|
|
|
22 common umount sys_oldumount sys_oldumount
|
|
|
|
23 32 setuid - sys_setuid16
|
2019-01-16 13:15:21 +00:00
|
|
|
24 32 getuid - sys_getuid16
|
2019-01-06 23:33:08 +00:00
|
|
|
25 32 stime - sys_stime32
|
2017-12-18 15:30:13 +00:00
|
|
|
26 common ptrace sys_ptrace compat_sys_ptrace
|
|
|
|
27 common alarm sys_alarm sys_alarm
|
|
|
|
29 common pause sys_pause sys_pause
|
2019-01-06 23:33:08 +00:00
|
|
|
30 common utime sys_utime sys_utime32
|
2019-01-16 13:15:23 +00:00
|
|
|
33 common access sys_access sys_access
|
2017-12-18 15:30:13 +00:00
|
|
|
34 common nice sys_nice sys_nice
|
|
|
|
36 common sync sys_sync sys_sync
|
|
|
|
37 common kill sys_kill sys_kill
|
2019-01-16 13:15:23 +00:00
|
|
|
38 common rename sys_rename sys_rename
|
|
|
|
39 common mkdir sys_mkdir sys_mkdir
|
|
|
|
40 common rmdir sys_rmdir sys_rmdir
|
2017-12-18 15:30:13 +00:00
|
|
|
41 common dup sys_dup sys_dup
|
2019-01-16 13:15:23 +00:00
|
|
|
42 common pipe sys_pipe sys_pipe
|
2017-12-18 15:30:13 +00:00
|
|
|
43 common times sys_times compat_sys_times
|
2019-01-16 13:15:23 +00:00
|
|
|
45 common brk sys_brk sys_brk
|
|
|
|
46 32 setgid - sys_setgid16
|
2019-01-16 13:15:21 +00:00
|
|
|
47 32 getgid - sys_getgid16
|
2019-01-16 13:15:23 +00:00
|
|
|
48 common signal sys_signal sys_signal
|
2019-01-16 13:15:21 +00:00
|
|
|
49 32 geteuid - sys_geteuid16
|
|
|
|
50 32 getegid - sys_getegid16
|
2019-01-16 13:15:23 +00:00
|
|
|
51 common acct sys_acct sys_acct
|
|
|
|
52 common umount2 sys_umount sys_umount
|
2017-12-18 15:30:13 +00:00
|
|
|
54 common ioctl sys_ioctl compat_sys_ioctl
|
|
|
|
55 common fcntl sys_fcntl compat_sys_fcntl
|
|
|
|
57 common setpgid sys_setpgid sys_setpgid
|
|
|
|
60 common umask sys_umask sys_umask
|
2019-01-16 13:15:23 +00:00
|
|
|
61 common chroot sys_chroot sys_chroot
|
2017-12-18 15:30:13 +00:00
|
|
|
62 common ustat sys_ustat compat_sys_ustat
|
|
|
|
63 common dup2 sys_dup2 sys_dup2
|
|
|
|
64 common getppid sys_getppid sys_getppid
|
|
|
|
65 common getpgrp sys_getpgrp sys_getpgrp
|
|
|
|
66 common setsid sys_setsid sys_setsid
|
|
|
|
67 common sigaction sys_sigaction compat_sys_sigaction
|
2019-01-16 13:15:23 +00:00
|
|
|
70 32 setreuid - sys_setreuid16
|
|
|
|
71 32 setregid - sys_setregid16
|
|
|
|
72 common sigsuspend sys_sigsuspend sys_sigsuspend
|
2017-12-18 15:30:13 +00:00
|
|
|
73 common sigpending sys_sigpending compat_sys_sigpending
|
2019-01-16 13:15:23 +00:00
|
|
|
74 common sethostname sys_sethostname sys_sethostname
|
2017-12-18 15:30:13 +00:00
|
|
|
75 common setrlimit sys_setrlimit compat_sys_setrlimit
|
|
|
|
76 32 getrlimit - compat_sys_old_getrlimit
|
|
|
|
77 common getrusage sys_getrusage compat_sys_getrusage
|
|
|
|
78 common gettimeofday sys_gettimeofday compat_sys_gettimeofday
|
|
|
|
79 common settimeofday sys_settimeofday compat_sys_settimeofday
|
2019-01-16 13:15:23 +00:00
|
|
|
80 32 getgroups - sys_getgroups16
|
|
|
|
81 32 setgroups - sys_setgroups16
|
|
|
|
83 common symlink sys_symlink sys_symlink
|
|
|
|
85 common readlink sys_readlink sys_readlink
|
|
|
|
86 common uselib sys_uselib sys_uselib
|
|
|
|
87 common swapon sys_swapon sys_swapon
|
|
|
|
88 common reboot sys_reboot sys_reboot
|
2017-12-18 15:30:13 +00:00
|
|
|
89 common readdir - compat_sys_old_readdir
|
|
|
|
90 common mmap sys_old_mmap compat_sys_s390_old_mmap
|
2019-01-16 13:15:23 +00:00
|
|
|
91 common munmap sys_munmap sys_munmap
|
2017-12-18 15:30:13 +00:00
|
|
|
92 common truncate sys_truncate compat_sys_truncate
|
|
|
|
93 common ftruncate sys_ftruncate compat_sys_ftruncate
|
|
|
|
94 common fchmod sys_fchmod sys_fchmod
|
2019-01-16 13:15:23 +00:00
|
|
|
95 32 fchown - sys_fchown16
|
2017-12-18 15:30:13 +00:00
|
|
|
96 common getpriority sys_getpriority sys_getpriority
|
|
|
|
97 common setpriority sys_setpriority sys_setpriority
|
|
|
|
99 common statfs sys_statfs compat_sys_statfs
|
|
|
|
100 common fstatfs sys_fstatfs compat_sys_fstatfs
|
|
|
|
101 32 ioperm - -
|
|
|
|
102 common socketcall sys_socketcall compat_sys_socketcall
|
2019-01-16 13:15:23 +00:00
|
|
|
103 common syslog sys_syslog sys_syslog
|
2017-12-18 15:30:13 +00:00
|
|
|
104 common setitimer sys_setitimer compat_sys_setitimer
|
|
|
|
105 common getitimer sys_getitimer compat_sys_getitimer
|
|
|
|
106 common stat sys_newstat compat_sys_newstat
|
|
|
|
107 common lstat sys_newlstat compat_sys_newlstat
|
|
|
|
108 common fstat sys_newfstat compat_sys_newfstat
|
2023-07-10 18:51:24 +00:00
|
|
|
110 common lookup_dcookie - -
|
2017-12-18 15:30:13 +00:00
|
|
|
111 common vhangup sys_vhangup sys_vhangup
|
|
|
|
112 common idle - -
|
|
|
|
114 common wait4 sys_wait4 compat_sys_wait4
|
2019-01-16 13:15:23 +00:00
|
|
|
115 common swapoff sys_swapoff sys_swapoff
|
2017-12-18 15:30:13 +00:00
|
|
|
116 common sysinfo sys_sysinfo compat_sys_sysinfo
|
|
|
|
117 common ipc sys_s390_ipc compat_sys_s390_ipc
|
|
|
|
118 common fsync sys_fsync sys_fsync
|
|
|
|
119 common sigreturn sys_sigreturn compat_sys_sigreturn
|
2019-01-16 13:15:23 +00:00
|
|
|
120 common clone sys_clone sys_clone
|
|
|
|
121 common setdomainname sys_setdomainname sys_setdomainname
|
|
|
|
122 common uname sys_newuname sys_newuname
|
2019-01-06 23:33:08 +00:00
|
|
|
124 common adjtimex sys_adjtimex sys_adjtimex_time32
|
2019-01-16 13:15:23 +00:00
|
|
|
125 common mprotect sys_mprotect sys_mprotect
|
2017-12-18 15:30:13 +00:00
|
|
|
126 common sigprocmask sys_sigprocmask compat_sys_sigprocmask
|
|
|
|
127 common create_module - -
|
2019-01-16 13:15:23 +00:00
|
|
|
128 common init_module sys_init_module sys_init_module
|
|
|
|
129 common delete_module sys_delete_module sys_delete_module
|
2017-12-18 15:30:13 +00:00
|
|
|
130 common get_kernel_syms - -
|
2019-01-16 13:15:23 +00:00
|
|
|
131 common quotactl sys_quotactl sys_quotactl
|
2017-12-18 15:30:13 +00:00
|
|
|
132 common getpgid sys_getpgid sys_getpgid
|
|
|
|
133 common fchdir sys_fchdir sys_fchdir
|
2021-06-29 20:11:44 +00:00
|
|
|
134 common bdflush sys_ni_syscall sys_ni_syscall
|
2019-01-16 13:15:23 +00:00
|
|
|
135 common sysfs sys_sysfs sys_sysfs
|
2017-12-18 15:30:13 +00:00
|
|
|
136 common personality sys_s390_personality sys_s390_personality
|
|
|
|
137 common afs_syscall - -
|
2019-01-16 13:15:23 +00:00
|
|
|
138 32 setfsuid - sys_setfsuid16
|
|
|
|
139 32 setfsgid - sys_setfsgid16
|
|
|
|
140 32 _llseek - sys_llseek
|
2017-12-18 15:30:13 +00:00
|
|
|
141 common getdents sys_getdents compat_sys_getdents
|
|
|
|
142 32 _newselect - compat_sys_select
|
|
|
|
142 64 select sys_select -
|
|
|
|
143 common flock sys_flock sys_flock
|
2019-01-16 13:15:23 +00:00
|
|
|
144 common msync sys_msync sys_msync
|
2020-09-25 04:51:43 +00:00
|
|
|
145 common readv sys_readv sys_readv
|
|
|
|
146 common writev sys_writev sys_writev
|
2017-12-18 15:30:13 +00:00
|
|
|
147 common getsid sys_getsid sys_getsid
|
|
|
|
148 common fdatasync sys_fdatasync sys_fdatasync
|
2020-08-15 00:31:07 +00:00
|
|
|
149 common _sysctl - -
|
2019-01-16 13:15:23 +00:00
|
|
|
150 common mlock sys_mlock sys_mlock
|
|
|
|
151 common munlock sys_munlock sys_munlock
|
2017-12-18 15:30:13 +00:00
|
|
|
152 common mlockall sys_mlockall sys_mlockall
|
|
|
|
153 common munlockall sys_munlockall sys_munlockall
|
2019-01-16 13:15:23 +00:00
|
|
|
154 common sched_setparam sys_sched_setparam sys_sched_setparam
|
|
|
|
155 common sched_getparam sys_sched_getparam sys_sched_getparam
|
|
|
|
156 common sched_setscheduler sys_sched_setscheduler sys_sched_setscheduler
|
2017-12-18 15:30:13 +00:00
|
|
|
157 common sched_getscheduler sys_sched_getscheduler sys_sched_getscheduler
|
|
|
|
158 common sched_yield sys_sched_yield sys_sched_yield
|
|
|
|
159 common sched_get_priority_max sys_sched_get_priority_max sys_sched_get_priority_max
|
|
|
|
160 common sched_get_priority_min sys_sched_get_priority_min sys_sched_get_priority_min
|
2019-01-06 23:33:08 +00:00
|
|
|
161 common sched_rr_get_interval sys_sched_rr_get_interval sys_sched_rr_get_interval_time32
|
|
|
|
162 common nanosleep sys_nanosleep sys_nanosleep_time32
|
2019-01-16 13:15:23 +00:00
|
|
|
163 common mremap sys_mremap sys_mremap
|
|
|
|
164 32 setresuid - sys_setresuid16
|
|
|
|
165 32 getresuid - sys_getresuid16
|
2017-12-18 15:30:13 +00:00
|
|
|
167 common query_module - -
|
2019-01-16 13:15:23 +00:00
|
|
|
168 common poll sys_poll sys_poll
|
2017-12-18 15:30:13 +00:00
|
|
|
169 common nfsservctl - -
|
2019-01-16 13:15:23 +00:00
|
|
|
170 32 setresgid - sys_setresgid16
|
|
|
|
171 32 getresgid - sys_getresgid16
|
|
|
|
172 common prctl sys_prctl sys_prctl
|
2017-12-18 15:30:13 +00:00
|
|
|
173 common rt_sigreturn sys_rt_sigreturn compat_sys_rt_sigreturn
|
|
|
|
174 common rt_sigaction sys_rt_sigaction compat_sys_rt_sigaction
|
|
|
|
175 common rt_sigprocmask sys_rt_sigprocmask compat_sys_rt_sigprocmask
|
|
|
|
176 common rt_sigpending sys_rt_sigpending compat_sys_rt_sigpending
|
2019-01-06 23:33:08 +00:00
|
|
|
177 common rt_sigtimedwait sys_rt_sigtimedwait compat_sys_rt_sigtimedwait_time32
|
2017-12-18 15:30:13 +00:00
|
|
|
178 common rt_sigqueueinfo sys_rt_sigqueueinfo compat_sys_rt_sigqueueinfo
|
|
|
|
179 common rt_sigsuspend sys_rt_sigsuspend compat_sys_rt_sigsuspend
|
|
|
|
180 common pread64 sys_pread64 compat_sys_s390_pread64
|
|
|
|
181 common pwrite64 sys_pwrite64 compat_sys_s390_pwrite64
|
2019-01-16 13:15:23 +00:00
|
|
|
182 32 chown - sys_chown16
|
|
|
|
183 common getcwd sys_getcwd sys_getcwd
|
|
|
|
184 common capget sys_capget sys_capget
|
|
|
|
185 common capset sys_capset sys_capset
|
2017-12-18 15:30:13 +00:00
|
|
|
186 common sigaltstack sys_sigaltstack compat_sys_sigaltstack
|
|
|
|
187 common sendfile sys_sendfile64 compat_sys_sendfile
|
|
|
|
188 common getpmsg - -
|
|
|
|
189 common putpmsg - -
|
|
|
|
190 common vfork sys_vfork sys_vfork
|
|
|
|
191 32 ugetrlimit - compat_sys_getrlimit
|
|
|
|
191 64 getrlimit sys_getrlimit -
|
|
|
|
192 32 mmap2 - compat_sys_s390_mmap2
|
|
|
|
193 32 truncate64 - compat_sys_s390_truncate64
|
|
|
|
194 32 ftruncate64 - compat_sys_s390_ftruncate64
|
|
|
|
195 32 stat64 - compat_sys_s390_stat64
|
|
|
|
196 32 lstat64 - compat_sys_s390_lstat64
|
|
|
|
197 32 fstat64 - compat_sys_s390_fstat64
|
2019-01-16 13:15:23 +00:00
|
|
|
198 32 lchown32 - sys_lchown
|
2017-12-18 15:30:13 +00:00
|
|
|
198 64 lchown sys_lchown -
|
|
|
|
199 32 getuid32 - sys_getuid
|
|
|
|
199 64 getuid sys_getuid -
|
|
|
|
200 32 getgid32 - sys_getgid
|
|
|
|
200 64 getgid sys_getgid -
|
|
|
|
201 32 geteuid32 - sys_geteuid
|
|
|
|
201 64 geteuid sys_geteuid -
|
|
|
|
202 32 getegid32 - sys_getegid
|
|
|
|
202 64 getegid sys_getegid -
|
|
|
|
203 32 setreuid32 - sys_setreuid
|
|
|
|
203 64 setreuid sys_setreuid -
|
|
|
|
204 32 setregid32 - sys_setregid
|
|
|
|
204 64 setregid sys_setregid -
|
2019-01-16 13:15:23 +00:00
|
|
|
205 32 getgroups32 - sys_getgroups
|
2017-12-18 15:30:13 +00:00
|
|
|
205 64 getgroups sys_getgroups -
|
2019-01-16 13:15:23 +00:00
|
|
|
206 32 setgroups32 - sys_setgroups
|
2017-12-18 15:30:13 +00:00
|
|
|
206 64 setgroups sys_setgroups -
|
|
|
|
207 32 fchown32 - sys_fchown
|
|
|
|
207 64 fchown sys_fchown -
|
|
|
|
208 32 setresuid32 - sys_setresuid
|
|
|
|
208 64 setresuid sys_setresuid -
|
2019-01-16 13:15:23 +00:00
|
|
|
209 32 getresuid32 - sys_getresuid
|
2017-12-18 15:30:13 +00:00
|
|
|
209 64 getresuid sys_getresuid -
|
|
|
|
210 32 setresgid32 - sys_setresgid
|
|
|
|
210 64 setresgid sys_setresgid -
|
2019-01-16 13:15:23 +00:00
|
|
|
211 32 getresgid32 - sys_getresgid
|
2017-12-18 15:30:13 +00:00
|
|
|
211 64 getresgid sys_getresgid -
|
2019-01-16 13:15:23 +00:00
|
|
|
212 32 chown32 - sys_chown
|
2017-12-18 15:30:13 +00:00
|
|
|
212 64 chown sys_chown -
|
|
|
|
213 32 setuid32 - sys_setuid
|
|
|
|
213 64 setuid sys_setuid -
|
|
|
|
214 32 setgid32 - sys_setgid
|
|
|
|
214 64 setgid sys_setgid -
|
|
|
|
215 32 setfsuid32 - sys_setfsuid
|
|
|
|
215 64 setfsuid sys_setfsuid -
|
|
|
|
216 32 setfsgid32 - sys_setfsgid
|
|
|
|
216 64 setfsgid sys_setfsgid -
|
2019-01-16 13:15:23 +00:00
|
|
|
217 common pivot_root sys_pivot_root sys_pivot_root
|
|
|
|
218 common mincore sys_mincore sys_mincore
|
|
|
|
219 common madvise sys_madvise sys_madvise
|
|
|
|
220 common getdents64 sys_getdents64 sys_getdents64
|
2017-12-18 15:30:13 +00:00
|
|
|
221 32 fcntl64 - compat_sys_fcntl64
|
|
|
|
222 common readahead sys_readahead compat_sys_s390_readahead
|
|
|
|
223 32 sendfile64 - compat_sys_sendfile64
|
2019-01-16 13:15:23 +00:00
|
|
|
224 common setxattr sys_setxattr sys_setxattr
|
|
|
|
225 common lsetxattr sys_lsetxattr sys_lsetxattr
|
|
|
|
226 common fsetxattr sys_fsetxattr sys_fsetxattr
|
|
|
|
227 common getxattr sys_getxattr sys_getxattr
|
|
|
|
228 common lgetxattr sys_lgetxattr sys_lgetxattr
|
|
|
|
229 common fgetxattr sys_fgetxattr sys_fgetxattr
|
|
|
|
230 common listxattr sys_listxattr sys_listxattr
|
|
|
|
231 common llistxattr sys_llistxattr sys_llistxattr
|
|
|
|
232 common flistxattr sys_flistxattr sys_flistxattr
|
|
|
|
233 common removexattr sys_removexattr sys_removexattr
|
|
|
|
234 common lremovexattr sys_lremovexattr sys_lremovexattr
|
|
|
|
235 common fremovexattr sys_fremovexattr sys_fremovexattr
|
2017-12-18 15:30:13 +00:00
|
|
|
236 common gettid sys_gettid sys_gettid
|
|
|
|
237 common tkill sys_tkill sys_tkill
|
2019-01-06 23:33:08 +00:00
|
|
|
238 common futex sys_futex sys_futex_time32
|
2017-12-18 15:30:13 +00:00
|
|
|
239 common sched_setaffinity sys_sched_setaffinity compat_sys_sched_setaffinity
|
|
|
|
240 common sched_getaffinity sys_sched_getaffinity compat_sys_sched_getaffinity
|
|
|
|
241 common tgkill sys_tgkill sys_tgkill
|
|
|
|
243 common io_setup sys_io_setup compat_sys_io_setup
|
2019-01-16 13:15:23 +00:00
|
|
|
244 common io_destroy sys_io_destroy sys_io_destroy
|
2019-01-06 23:33:08 +00:00
|
|
|
245 common io_getevents sys_io_getevents sys_io_getevents_time32
|
2017-12-18 15:30:13 +00:00
|
|
|
246 common io_submit sys_io_submit compat_sys_io_submit
|
2019-01-16 13:15:23 +00:00
|
|
|
247 common io_cancel sys_io_cancel sys_io_cancel
|
2017-12-18 15:30:13 +00:00
|
|
|
248 common exit_group sys_exit_group sys_exit_group
|
|
|
|
249 common epoll_create sys_epoll_create sys_epoll_create
|
2019-01-16 13:15:23 +00:00
|
|
|
250 common epoll_ctl sys_epoll_ctl sys_epoll_ctl
|
|
|
|
251 common epoll_wait sys_epoll_wait sys_epoll_wait
|
|
|
|
252 common set_tid_address sys_set_tid_address sys_set_tid_address
|
2017-12-18 15:30:13 +00:00
|
|
|
253 common fadvise64 sys_fadvise64_64 compat_sys_s390_fadvise64
|
|
|
|
254 common timer_create sys_timer_create compat_sys_timer_create
|
2019-01-06 23:33:08 +00:00
|
|
|
255 common timer_settime sys_timer_settime sys_timer_settime32
|
|
|
|
256 common timer_gettime sys_timer_gettime sys_timer_gettime32
|
2017-12-18 15:30:13 +00:00
|
|
|
257 common timer_getoverrun sys_timer_getoverrun sys_timer_getoverrun
|
|
|
|
258 common timer_delete sys_timer_delete sys_timer_delete
|
2019-01-06 23:33:08 +00:00
|
|
|
259 common clock_settime sys_clock_settime sys_clock_settime32
|
|
|
|
260 common clock_gettime sys_clock_gettime sys_clock_gettime32
|
|
|
|
261 common clock_getres sys_clock_getres sys_clock_getres_time32
|
|
|
|
262 common clock_nanosleep sys_clock_nanosleep sys_clock_nanosleep_time32
|
2017-12-18 15:30:13 +00:00
|
|
|
264 32 fadvise64_64 - compat_sys_s390_fadvise64_64
|
|
|
|
265 common statfs64 sys_statfs64 compat_sys_statfs64
|
|
|
|
266 common fstatfs64 sys_fstatfs64 compat_sys_fstatfs64
|
2019-01-16 13:15:23 +00:00
|
|
|
267 common remap_file_pages sys_remap_file_pages sys_remap_file_pages
|
2021-09-08 22:18:25 +00:00
|
|
|
268 common mbind sys_mbind sys_mbind
|
|
|
|
269 common get_mempolicy sys_get_mempolicy sys_get_mempolicy
|
|
|
|
270 common set_mempolicy sys_set_mempolicy sys_set_mempolicy
|
2017-12-18 15:30:13 +00:00
|
|
|
271 common mq_open sys_mq_open compat_sys_mq_open
|
2019-01-16 13:15:23 +00:00
|
|
|
272 common mq_unlink sys_mq_unlink sys_mq_unlink
|
2019-01-06 23:33:08 +00:00
|
|
|
273 common mq_timedsend sys_mq_timedsend sys_mq_timedsend_time32
|
|
|
|
274 common mq_timedreceive sys_mq_timedreceive sys_mq_timedreceive_time32
|
2017-12-18 15:30:13 +00:00
|
|
|
275 common mq_notify sys_mq_notify compat_sys_mq_notify
|
|
|
|
276 common mq_getsetattr sys_mq_getsetattr compat_sys_mq_getsetattr
|
|
|
|
277 common kexec_load sys_kexec_load compat_sys_kexec_load
|
2019-01-16 13:15:23 +00:00
|
|
|
278 common add_key sys_add_key sys_add_key
|
|
|
|
279 common request_key sys_request_key sys_request_key
|
2017-12-18 15:30:13 +00:00
|
|
|
280 common keyctl sys_keyctl compat_sys_keyctl
|
|
|
|
281 common waitid sys_waitid compat_sys_waitid
|
|
|
|
282 common ioprio_set sys_ioprio_set sys_ioprio_set
|
|
|
|
283 common ioprio_get sys_ioprio_get sys_ioprio_get
|
|
|
|
284 common inotify_init sys_inotify_init sys_inotify_init
|
2019-01-16 13:15:23 +00:00
|
|
|
285 common inotify_add_watch sys_inotify_add_watch sys_inotify_add_watch
|
2017-12-18 15:30:13 +00:00
|
|
|
286 common inotify_rm_watch sys_inotify_rm_watch sys_inotify_rm_watch
|
2021-09-08 22:18:25 +00:00
|
|
|
287 common migrate_pages sys_migrate_pages sys_migrate_pages
|
2017-12-18 15:30:13 +00:00
|
|
|
288 common openat sys_openat compat_sys_openat
|
2019-01-16 13:15:23 +00:00
|
|
|
289 common mkdirat sys_mkdirat sys_mkdirat
|
|
|
|
290 common mknodat sys_mknodat sys_mknodat
|
|
|
|
291 common fchownat sys_fchownat sys_fchownat
|
2019-01-06 23:33:08 +00:00
|
|
|
292 common futimesat sys_futimesat sys_futimesat_time32
|
2017-12-18 15:30:13 +00:00
|
|
|
293 32 fstatat64 - compat_sys_s390_fstatat64
|
|
|
|
293 64 newfstatat sys_newfstatat -
|
2019-01-16 13:15:23 +00:00
|
|
|
294 common unlinkat sys_unlinkat sys_unlinkat
|
|
|
|
295 common renameat sys_renameat sys_renameat
|
|
|
|
296 common linkat sys_linkat sys_linkat
|
|
|
|
297 common symlinkat sys_symlinkat sys_symlinkat
|
|
|
|
298 common readlinkat sys_readlinkat sys_readlinkat
|
|
|
|
299 common fchmodat sys_fchmodat sys_fchmodat
|
|
|
|
300 common faccessat sys_faccessat sys_faccessat
|
2019-01-06 23:33:08 +00:00
|
|
|
301 common pselect6 sys_pselect6 compat_sys_pselect6_time32
|
|
|
|
302 common ppoll sys_ppoll compat_sys_ppoll_time32
|
2019-01-16 13:15:23 +00:00
|
|
|
303 common unshare sys_unshare sys_unshare
|
2017-12-18 15:30:13 +00:00
|
|
|
304 common set_robust_list sys_set_robust_list compat_sys_set_robust_list
|
|
|
|
305 common get_robust_list sys_get_robust_list compat_sys_get_robust_list
|
2019-01-16 13:15:23 +00:00
|
|
|
306 common splice sys_splice sys_splice
|
2017-12-18 15:30:13 +00:00
|
|
|
307 common sync_file_range sys_sync_file_range compat_sys_s390_sync_file_range
|
2019-01-16 13:15:23 +00:00
|
|
|
308 common tee sys_tee sys_tee
|
2020-09-25 04:51:44 +00:00
|
|
|
309 common vmsplice sys_vmsplice sys_vmsplice
|
2021-09-08 22:18:25 +00:00
|
|
|
310 common move_pages sys_move_pages sys_move_pages
|
2019-01-16 13:15:23 +00:00
|
|
|
311 common getcpu sys_getcpu sys_getcpu
|
2017-12-18 15:30:13 +00:00
|
|
|
312 common epoll_pwait sys_epoll_pwait compat_sys_epoll_pwait
|
2019-01-06 23:33:08 +00:00
|
|
|
313 common utimes sys_utimes sys_utimes_time32
|
2017-12-18 15:30:13 +00:00
|
|
|
314 common fallocate sys_fallocate compat_sys_s390_fallocate
|
2019-01-06 23:33:08 +00:00
|
|
|
315 common utimensat sys_utimensat sys_utimensat_time32
|
2017-12-18 15:30:13 +00:00
|
|
|
316 common signalfd sys_signalfd compat_sys_signalfd
|
|
|
|
317 common timerfd - -
|
|
|
|
318 common eventfd sys_eventfd sys_eventfd
|
|
|
|
319 common timerfd_create sys_timerfd_create sys_timerfd_create
|
2019-01-06 23:33:08 +00:00
|
|
|
320 common timerfd_settime sys_timerfd_settime sys_timerfd_settime32
|
|
|
|
321 common timerfd_gettime sys_timerfd_gettime sys_timerfd_gettime32
|
2017-12-18 15:30:13 +00:00
|
|
|
322 common signalfd4 sys_signalfd4 compat_sys_signalfd4
|
|
|
|
323 common eventfd2 sys_eventfd2 sys_eventfd2
|
|
|
|
324 common inotify_init1 sys_inotify_init1 sys_inotify_init1
|
2019-01-16 13:15:23 +00:00
|
|
|
325 common pipe2 sys_pipe2 sys_pipe2
|
2017-12-18 15:30:13 +00:00
|
|
|
326 common dup3 sys_dup3 sys_dup3
|
|
|
|
327 common epoll_create1 sys_epoll_create1 sys_epoll_create1
|
|
|
|
328 common preadv sys_preadv compat_sys_preadv
|
|
|
|
329 common pwritev sys_pwritev compat_sys_pwritev
|
|
|
|
330 common rt_tgsigqueueinfo sys_rt_tgsigqueueinfo compat_sys_rt_tgsigqueueinfo
|
2019-01-16 13:15:23 +00:00
|
|
|
331 common perf_event_open sys_perf_event_open sys_perf_event_open
|
2017-12-18 15:30:13 +00:00
|
|
|
332 common fanotify_init sys_fanotify_init sys_fanotify_init
|
|
|
|
333 common fanotify_mark sys_fanotify_mark compat_sys_fanotify_mark
|
2019-01-16 13:15:23 +00:00
|
|
|
334 common prlimit64 sys_prlimit64 sys_prlimit64
|
|
|
|
335 common name_to_handle_at sys_name_to_handle_at sys_name_to_handle_at
|
2017-12-18 15:30:13 +00:00
|
|
|
336 common open_by_handle_at sys_open_by_handle_at compat_sys_open_by_handle_at
|
2019-01-06 23:33:08 +00:00
|
|
|
337 common clock_adjtime sys_clock_adjtime sys_clock_adjtime32
|
2017-12-18 15:30:13 +00:00
|
|
|
338 common syncfs sys_syncfs sys_syncfs
|
|
|
|
339 common setns sys_setns sys_setns
|
2020-09-25 04:51:45 +00:00
|
|
|
340 common process_vm_readv sys_process_vm_readv sys_process_vm_readv
|
|
|
|
341 common process_vm_writev sys_process_vm_writev sys_process_vm_writev
|
2017-12-18 15:30:13 +00:00
|
|
|
342 common s390_runtime_instr sys_s390_runtime_instr sys_s390_runtime_instr
|
2019-01-16 13:15:23 +00:00
|
|
|
343 common kcmp sys_kcmp sys_kcmp
|
|
|
|
344 common finit_module sys_finit_module sys_finit_module
|
|
|
|
345 common sched_setattr sys_sched_setattr sys_sched_setattr
|
|
|
|
346 common sched_getattr sys_sched_getattr sys_sched_getattr
|
|
|
|
347 common renameat2 sys_renameat2 sys_renameat2
|
|
|
|
348 common seccomp sys_seccomp sys_seccomp
|
|
|
|
349 common getrandom sys_getrandom sys_getrandom
|
|
|
|
350 common memfd_create sys_memfd_create sys_memfd_create
|
|
|
|
351 common bpf sys_bpf sys_bpf
|
|
|
|
352 common s390_pci_mmio_write sys_s390_pci_mmio_write sys_s390_pci_mmio_write
|
|
|
|
353 common s390_pci_mmio_read sys_s390_pci_mmio_read sys_s390_pci_mmio_read
|
2017-12-18 15:30:13 +00:00
|
|
|
354 common execveat sys_execveat compat_sys_execveat
|
|
|
|
355 common userfaultfd sys_userfaultfd sys_userfaultfd
|
|
|
|
356 common membarrier sys_membarrier sys_membarrier
|
2019-01-06 23:33:08 +00:00
|
|
|
357 common recvmmsg sys_recvmmsg compat_sys_recvmmsg_time32
|
2017-12-18 15:30:13 +00:00
|
|
|
358 common sendmmsg sys_sendmmsg compat_sys_sendmmsg
|
|
|
|
359 common socket sys_socket sys_socket
|
2019-01-16 13:15:23 +00:00
|
|
|
360 common socketpair sys_socketpair sys_socketpair
|
|
|
|
361 common bind sys_bind sys_bind
|
|
|
|
362 common connect sys_connect sys_connect
|
2017-12-18 15:30:13 +00:00
|
|
|
363 common listen sys_listen sys_listen
|
2019-01-16 13:15:23 +00:00
|
|
|
364 common accept4 sys_accept4 sys_accept4
|
2020-07-17 06:23:15 +00:00
|
|
|
365 common getsockopt sys_getsockopt sys_getsockopt
|
|
|
|
366 common setsockopt sys_setsockopt sys_setsockopt
|
2019-01-16 13:15:23 +00:00
|
|
|
367 common getsockname sys_getsockname sys_getsockname
|
|
|
|
368 common getpeername sys_getpeername sys_getpeername
|
|
|
|
369 common sendto sys_sendto sys_sendto
|
2017-12-18 15:30:13 +00:00
|
|
|
370 common sendmsg sys_sendmsg compat_sys_sendmsg
|
|
|
|
371 common recvfrom sys_recvfrom compat_sys_recvfrom
|
|
|
|
372 common recvmsg sys_recvmsg compat_sys_recvmsg
|
|
|
|
373 common shutdown sys_shutdown sys_shutdown
|
2019-01-16 13:15:23 +00:00
|
|
|
374 common mlock2 sys_mlock2 sys_mlock2
|
|
|
|
375 common copy_file_range sys_copy_file_range sys_copy_file_range
|
2017-12-18 15:30:13 +00:00
|
|
|
376 common preadv2 sys_preadv2 compat_sys_preadv2
|
|
|
|
377 common pwritev2 sys_pwritev2 compat_sys_pwritev2
|
2019-01-16 13:15:23 +00:00
|
|
|
378 common s390_guarded_storage sys_s390_guarded_storage sys_s390_guarded_storage
|
|
|
|
379 common statx sys_statx sys_statx
|
|
|
|
380 common s390_sthyi sys_s390_sthyi sys_s390_sthyi
|
|
|
|
381 common kexec_file_load sys_kexec_file_load sys_kexec_file_load
|
2018-06-30 08:53:57 +00:00
|
|
|
382 common io_pgetevents sys_io_pgetevents compat_sys_io_pgetevents
|
2019-01-16 13:15:23 +00:00
|
|
|
383 common rseq sys_rseq sys_rseq
|
2018-12-31 22:12:32 +00:00
|
|
|
384 common pkey_mprotect sys_pkey_mprotect sys_pkey_mprotect
|
|
|
|
385 common pkey_alloc sys_pkey_alloc sys_pkey_alloc
|
|
|
|
386 common pkey_free sys_pkey_free sys_pkey_free
|
2018-12-31 13:38:26 +00:00
|
|
|
# room for arch specific syscalls
|
|
|
|
392 64 semtimedop sys_semtimedop -
|
|
|
|
393 common semget sys_semget sys_semget
|
|
|
|
394 common semctl sys_semctl compat_sys_semctl
|
|
|
|
395 common shmget sys_shmget sys_shmget
|
|
|
|
396 common shmctl sys_shmctl compat_sys_shmctl
|
|
|
|
397 common shmat sys_shmat compat_sys_shmat
|
|
|
|
398 common shmdt sys_shmdt sys_shmdt
|
|
|
|
399 common msgget sys_msgget sys_msgget
|
|
|
|
400 common msgsnd sys_msgsnd compat_sys_msgsnd
|
|
|
|
401 common msgrcv sys_msgrcv compat_sys_msgrcv
|
|
|
|
402 common msgctl sys_msgctl compat_sys_msgctl
|
2019-01-10 11:45:11 +00:00
|
|
|
403 32 clock_gettime64 - sys_clock_gettime
|
|
|
|
404 32 clock_settime64 - sys_clock_settime
|
|
|
|
405 32 clock_adjtime64 - sys_clock_adjtime
|
|
|
|
406 32 clock_getres_time64 - sys_clock_getres
|
|
|
|
407 32 clock_nanosleep_time64 - sys_clock_nanosleep
|
|
|
|
408 32 timer_gettime64 - sys_timer_gettime
|
|
|
|
409 32 timer_settime64 - sys_timer_settime
|
|
|
|
410 32 timerfd_gettime64 - sys_timerfd_gettime
|
|
|
|
411 32 timerfd_settime64 - sys_timerfd_settime
|
|
|
|
412 32 utimensat_time64 - sys_utimensat
|
|
|
|
413 32 pselect6_time64 - compat_sys_pselect6_time64
|
|
|
|
414 32 ppoll_time64 - compat_sys_ppoll_time64
|
|
|
|
416 32 io_pgetevents_time64 - sys_io_pgetevents
|
|
|
|
417 32 recvmmsg_time64 - compat_sys_recvmmsg_time64
|
|
|
|
418 32 mq_timedsend_time64 - sys_mq_timedsend
|
|
|
|
419 32 mq_timedreceive_time64 - sys_mq_timedreceive
|
|
|
|
420 32 semtimedop_time64 - sys_semtimedop
|
|
|
|
421 32 rt_sigtimedwait_time64 - compat_sys_rt_sigtimedwait_time64
|
|
|
|
422 32 futex_time64 - sys_futex
|
|
|
|
423 32 sched_rr_get_interval_time64 - sys_sched_rr_get_interval
|
2019-02-28 12:59:19 +00:00
|
|
|
424 common pidfd_send_signal sys_pidfd_send_signal sys_pidfd_send_signal
|
|
|
|
425 common io_uring_setup sys_io_uring_setup sys_io_uring_setup
|
|
|
|
426 common io_uring_enter sys_io_uring_enter sys_io_uring_enter
|
|
|
|
427 common io_uring_register sys_io_uring_register sys_io_uring_register
|
2019-05-16 11:52:34 +00:00
|
|
|
428 common open_tree sys_open_tree sys_open_tree
|
|
|
|
429 common move_mount sys_move_mount sys_move_mount
|
|
|
|
430 common fsopen sys_fsopen sys_fsopen
|
|
|
|
431 common fsconfig sys_fsconfig sys_fsconfig
|
|
|
|
432 common fsmount sys_fsmount sys_fsmount
|
|
|
|
433 common fspick sys_fspick sys_fspick
|
2019-05-24 10:44:59 +00:00
|
|
|
434 common pidfd_open sys_pidfd_open sys_pidfd_open
|
s390: wire up clone3 system call
Tested (64-bit and compat mode) using program from
http://lkml.kernel.org/r/20190604212930.jaaztvkent32b7d3@brauner.io
with the following:
return syscall(__NR_clone, flags, 0, pidfd, 0, 0);
changed to:
return syscall(__NR_clone, 0, flags, pidfd, 0, 0);
due to CLONE_BACKWARDS2.
Signed-off-by: Vasily Gorbik <gor@linux.ibm.com>
Acked-by: Christian Borntraeger <borntraeger@de.ibm.com>
Signed-off-by: Heiko Carstens <heiko.carstens@de.ibm.com>
2019-07-14 18:49:23 +00:00
|
|
|
435 common clone3 sys_clone3 sys_clone3
|
2019-05-24 09:31:44 +00:00
|
|
|
436 common close_range sys_close_range sys_close_range
|
open: introduce openat2(2) syscall
/* Background. */
For a very long time, extending openat(2) with new features has been
incredibly frustrating. This stems from the fact that openat(2) is
possibly the most famous counter-example to the mantra "don't silently
accept garbage from userspace" -- it doesn't check whether unknown flags
are present[1].
This means that (generally) the addition of new flags to openat(2) has
been fraught with backwards-compatibility issues (O_TMPFILE has to be
defined as __O_TMPFILE|O_DIRECTORY|[O_RDWR or O_WRONLY] to ensure old
kernels gave errors, since it's insecure to silently ignore the
flag[2]). All new security-related flags therefore have a tough road to
being added to openat(2).
Userspace also has a hard time figuring out whether a particular flag is
supported on a particular kernel. While it is now possible with
contemporary kernels (thanks to [3]), older kernels will expose unknown
flag bits through fcntl(F_GETFL). Giving a clear -EINVAL during
openat(2) time matches modern syscall designs and is far more
fool-proof.
In addition, the newly-added path resolution restriction LOOKUP flags
(which we would like to expose to user-space) don't feel related to the
pre-existing O_* flag set -- they affect all components of path lookup.
We'd therefore like to add a new flag argument.
Adding a new syscall allows us to finally fix the flag-ignoring problem,
and we can make it extensible enough so that we will hopefully never
need an openat3(2).
/* Syscall Prototype. */
/*
* open_how is an extensible structure (similar in interface to
* clone3(2) or sched_setattr(2)). The size parameter must be set to
* sizeof(struct open_how), to allow for future extensions. All future
* extensions will be appended to open_how, with their zero value
* acting as a no-op default.
*/
struct open_how { /* ... */ };
int openat2(int dfd, const char *pathname,
struct open_how *how, size_t size);
/* Description. */
The initial version of 'struct open_how' contains the following fields:
flags
Used to specify openat(2)-style flags. However, any unknown flag
bits or otherwise incorrect flag combinations (like O_PATH|O_RDWR)
will result in -EINVAL. In addition, this field is 64-bits wide to
allow for more O_ flags than currently permitted with openat(2).
mode
The file mode for O_CREAT or O_TMPFILE.
Must be set to zero if flags does not contain O_CREAT or O_TMPFILE.
resolve
Restrict path resolution (in contrast to O_* flags they affect all
path components). The current set of flags are as follows (at the
moment, all of the RESOLVE_ flags are implemented as just passing
the corresponding LOOKUP_ flag).
RESOLVE_NO_XDEV => LOOKUP_NO_XDEV
RESOLVE_NO_SYMLINKS => LOOKUP_NO_SYMLINKS
RESOLVE_NO_MAGICLINKS => LOOKUP_NO_MAGICLINKS
RESOLVE_BENEATH => LOOKUP_BENEATH
RESOLVE_IN_ROOT => LOOKUP_IN_ROOT
open_how does not contain an embedded size field, because it is of
little benefit (userspace can figure out the kernel open_how size at
runtime fairly easily without it). It also only contains u64s (even
though ->mode arguably should be a u16) to avoid having padding fields
which are never used in the future.
Note that as a result of the new how->flags handling, O_PATH|O_TMPFILE
is no longer permitted for openat(2). As far as I can tell, this has
always been a bug and appears to not be used by userspace (and I've not
seen any problems on my machines by disallowing it). If it turns out
this breaks something, we can special-case it and only permit it for
openat(2) but not openat2(2).
After input from Florian Weimer, the new open_how and flag definitions
are inside a separate header from uapi/linux/fcntl.h, to avoid problems
that glibc has with importing that header.
/* Testing. */
In a follow-up patch there are over 200 selftests which ensure that this
syscall has the correct semantics and will correctly handle several
attack scenarios.
In addition, I've written a userspace library[4] which provides
convenient wrappers around openat2(RESOLVE_IN_ROOT) (this is necessary
because no other syscalls support RESOLVE_IN_ROOT, and thus lots of care
must be taken when using RESOLVE_IN_ROOT'd file descriptors with other
syscalls). During the development of this patch, I've run numerous
verification tests using libpathrs (showing that the API is reasonably
usable by userspace).
/* Future Work. */
Additional RESOLVE_ flags have been suggested during the review period.
These can be easily implemented separately (such as blocking auto-mount
during resolution).
Furthermore, there are some other proposed changes to the openat(2)
interface (the most obvious example is magic-link hardening[5]) which
would be a good opportunity to add a way for userspace to restrict how
O_PATH file descriptors can be re-opened.
Another possible avenue of future work would be some kind of
CHECK_FIELDS[6] flag which causes the kernel to indicate to userspace
which openat2(2) flags and fields are supported by the current kernel
(to avoid userspace having to go through several guesses to figure it
out).
[1]: https://lwn.net/Articles/588444/
[2]: https://lore.kernel.org/lkml/CA+55aFyyxJL1LyXZeBsf2ypriraj5ut1XkNDsunRBqgVjZU_6Q@mail.gmail.com
[3]: commit 629e014bb834 ("fs: completely ignore unknown open flags")
[4]: https://sourceware.org/bugzilla/show_bug.cgi?id=17523
[5]: https://lore.kernel.org/lkml/20190930183316.10190-2-cyphar@cyphar.com/
[6]: https://youtu.be/ggD-eb3yPVs
Suggested-by: Christian Brauner <christian.brauner@ubuntu.com>
Signed-off-by: Aleksa Sarai <cyphar@cyphar.com>
Signed-off-by: Al Viro <viro@zeniv.linux.org.uk>
2020-01-18 12:07:59 +00:00
|
|
|
437 common openat2 sys_openat2 sys_openat2
|
2020-01-07 17:59:26 +00:00
|
|
|
438 common pidfd_getfd sys_pidfd_getfd sys_pidfd_getfd
|
2020-05-14 14:44:25 +00:00
|
|
|
439 common faccessat2 sys_faccessat2 sys_faccessat2
|
mm/madvise: introduce process_madvise() syscall: an external memory hinting API
There is a use case where System Management Software (SMS) wants to give a
memory hint like MADV_[COLD|PAGEOUT] to other processes, and in the
case of Android, it is the ActivityManagerService.
The information required to make the reclaim decision is not known to the
app. Instead, it is known to the centralized userspace
daemon(ActivityManagerService), and that daemon must be able to initiate
reclaim on its own without any app involvement.
To solve the issue, this patch introduces a new syscall
process_madvise(2). It uses pidfd of an external process to give the
hint. It also supports vector address range because Android app has
thousands of vmas due to zygote so it's a total waste of CPU and power if
we have to call the syscall one by one for each vma. (With testing 2000-vma
syscall vs 1-vector syscall, it showed 15% performance improvement. I
think it would be bigger in real practice because the testing ran very
cache friendly environment).
Another potential use case for the vector range is to amortize the cost
of TLB shootdowns for multiple ranges when using MADV_DONTNEED; this could
benefit users like TCP receive zerocopy and malloc implementations. In
future, we could find more use cases for other advice values, so let's make it
happen as an API since we are introducing a new syscall at this moment. With
that, existing madvise(2) user could replace it with process_madvise(2)
with their own pid if they want to have batch address ranges support
feature.
Since it could affect another process's address range, only a privileged
process (PTRACE_MODE_ATTACH_FSCREDS), or one that something else (e.g., being the
same UID) gives the right to ptrace the target process, can use it successfully.
The flag argument is reserved for future use if we need to extend the API.
I think supporting every hint that madvise has or will support in
process_madvise is rather risky. Because we are not sure all hints make
sense from external process and implementation for the hint may rely on
the caller being in the current context so it could be error-prone. Thus,
I just limited hints as MADV_[COLD|PAGEOUT] in this patch.
If someone wants to add other hints, we could hear the use case and review
it for each hint. It's safer for maintenance rather than introducing a
buggy syscall but hard to fix it later.
So finally, the API is as follows,
ssize_t process_madvise(int pidfd, const struct iovec *iovec,
unsigned long vlen, int advice, unsigned int flags);
DESCRIPTION
The process_madvise() system call is used to give advice or directions
to the kernel about the address ranges from external process as well as
local process. It provides the advice to address ranges of process
described by iovec and vlen. The goal of such advice is to improve
system or application performance.
The pidfd selects the process referred to by the PID file descriptor
specified in pidfd. (See pidfd_open(2) for further information.)
The pointer iovec points to an array of iovec structures, defined in
<sys/uio.h> as:
struct iovec {
void *iov_base; /* starting address */
size_t iov_len; /* number of bytes to be advised */
};
The iovec describes address ranges beginning at address(iov_base)
and with size length of bytes(iov_len).
The vlen represents the number of elements in iovec.
The advice is indicated in the advice argument, which is one of the
following at this moment if the target process specified by pidfd is
external.
MADV_COLD
MADV_PAGEOUT
Permission to provide a hint to external process is governed by a
ptrace access mode PTRACE_MODE_ATTACH_FSCREDS check; see ptrace(2).
The process_madvise supports every advice madvise(2) has if target
process is in same thread group with calling process so user could
use process_madvise(2) to extend existing madvise(2) to support
vector address ranges.
RETURN VALUE
On success, process_madvise() returns the number of bytes advised.
This return value may be less than the total number of requested
bytes, if an error occurred. The caller should check return value
to determine whether a partial advice occurred.
FAQ:
Q.1 - Why does any external entity have better knowledge?
Quote from Sandeep
"For Android, every application (including the special SystemServer)
are forked from Zygote. The reason of course is to share as many
libraries and classes between the two as possible to benefit from the
preloading during boot.
After applications start, (almost) all of the APIs end up calling into
this SystemServer process over IPC (binder) and back to the
application.
In a fully running system, the SystemServer monitors every single
process periodically to calculate their PSS / RSS and also decides
which process is "important" to the user for interactivity.
So, because of how these processes start _and_ the fact that the
SystemServer is looping to monitor each process, it does tend to *know*
which address range of the application is not used / useful.
Besides, we can never rely on applications to clean things up
themselves. We've had the "hey app1, the system is low on memory,
please trim your memory usage down" notifications for a long time[1].
They rely on applications honoring the broadcasts and very few do.
So, if we want to avoid the inevitable killing of the application and
restarting it, some way to be able to tell the OS about unimportant
memory in these applications will be useful.
- ssp
Q.2 - How to guarantee the race(i.e., object validation) between when
giving a hint from an external process and get the hint from the target
process?
process_madvise operates on the target process's address space as it
exists at the instant that process_madvise is called. If the
target process can run between the time the process_madvise process
inspects the target process address space and the time that
process_madvise is actually called, process_madvise may operate on
memory regions that the calling process does not expect. It's the
responsibility of the process calling process_madvise to close this
race condition. For example, the calling process can suspend the
target process with ptrace, SIGSTOP, or the freezer cgroup so that it
doesn't have an opportunity to change its own address space before
process_madvise is called. Another option is to operate on memory
regions that the caller knows a priori will be unchanged in the target
process. Yet another option is to accept the race for certain
process_madvise calls after reasoning that mistargeting will do no
harm. The suggested API itself does not provide synchronization. The
same applies to other APIs like move_pages, process_vm_write.
The race isn't really a problem though. Why is it so wrong to require
that callers do their own synchronization in some manner? Nobody
objects to write(2) merely because it's possible for two processes to
open the same file and clobber each other's writes --- instead, we tell
people to use flock or something. Think about mmap. It never
guarantees newly allocated address space is still valid when the user
tries to access it because other threads could unmap the memory right
before. That's where we need synchronization by using other API or
design from userside. It shouldn't be part of API itself. If someone
needs more fine-grained synchronization rather than process level,
there were two ideas suggested - cookie[2] and anon-fd[3]. Both are
applicable via using last reserved argument of the API but I don't
think it's necessary right now since we have already ways to prevent
the race so don't want to add additional complexity with more
fine-grained optimization model.
To make the API extensible, it reserves an unsigned long as last argument
so we could support it in future if someone really needs it.
Q.3 - Why doesn't ptrace work?
Injecting an madvise in the target process using ptrace would not work
for us because such injected madvise would have to be executed by the
target process, which means that process would have to be runnable and
that creates the risk of the abovementioned race and hinting a wrong
VMA. Furthermore, we want to act on the hint in the caller's context, not the
callee's, because the callee is usually limited by cpuset/cgroups or
even in a frozen state so it can't act by itself quickly enough, which
causes more thrashing/kills. It doesn't work if the target process is
ptraced (e.g., strace, debugger, minidump) because a process can have at
most one ptracer.
[1] https://developer.android.com/topic/performance/memory"
[2] process_getinfo for getting the cookie which is updated whenever
vma of process address layout are changed - Daniel Colascione -
https://lore.kernel.org/lkml/20190520035254.57579-1-minchan@kernel.org/T/#m7694416fd179b2066a2c62b5b139b14e3894e224
[3] anonymous fd which is used for the object(i.e., address range)
validation - Michal Hocko -
https://lore.kernel.org/lkml/20200120112722.GY18451@dhcp22.suse.cz/
[minchan@kernel.org: fix process_madvise build break for arm64]
Link: http://lkml.kernel.org/r/20200303145756.GA219683@google.com
[minchan@kernel.org: fix build error for mips of process_madvise]
Link: http://lkml.kernel.org/r/20200508052517.GA197378@google.com
[akpm@linux-foundation.org: fix patch ordering issue]
[akpm@linux-foundation.org: fix arm64 whoops]
[minchan@kernel.org: make process_madvise() vlen arg have type size_t, per Florian]
[akpm@linux-foundation.org: fix i386 build]
[sfr@canb.auug.org.au: fix syscall numbering]
Link: https://lkml.kernel.org/r/20200905142639.49fc3f1a@canb.auug.org.au
[sfr@canb.auug.org.au: madvise.c needs compat.h]
Link: https://lkml.kernel.org/r/20200908204547.285646b4@canb.auug.org.au
[minchan@kernel.org: fix mips build]
Link: https://lkml.kernel.org/r/20200909173655.GC2435453@google.com
[yuehaibing@huawei.com: remove duplicate header which is included twice]
Link: https://lkml.kernel.org/r/20200915121550.30584-1-yuehaibing@huawei.com
[minchan@kernel.org: do not use helper functions for process_madvise]
Link: https://lkml.kernel.org/r/20200921175539.GB387368@google.com
[akpm@linux-foundation.org: pidfd_get_pid() gained an argument]
[sfr@canb.auug.org.au: fix up for "iov_iter: transparently handle compat iovecs in import_iovec"]
Link: https://lkml.kernel.org/r/20200928212542.468e1fef@canb.auug.org.au
Signed-off-by: Minchan Kim <minchan@kernel.org>
Signed-off-by: YueHaibing <yuehaibing@huawei.com>
Signed-off-by: Stephen Rothwell <sfr@canb.auug.org.au>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Reviewed-by: Suren Baghdasaryan <surenb@google.com>
Reviewed-by: Vlastimil Babka <vbabka@suse.cz>
Acked-by: David Rientjes <rientjes@google.com>
Cc: Alexander Duyck <alexander.h.duyck@linux.intel.com>
Cc: Brian Geffon <bgeffon@google.com>
Cc: Christian Brauner <christian@brauner.io>
Cc: Daniel Colascione <dancol@google.com>
Cc: Jann Horn <jannh@google.com>
Cc: Jens Axboe <axboe@kernel.dk>
Cc: Joel Fernandes <joel@joelfernandes.org>
Cc: Johannes Weiner <hannes@cmpxchg.org>
Cc: John Dias <joaodias@google.com>
Cc: Kirill Tkhai <ktkhai@virtuozzo.com>
Cc: Michal Hocko <mhocko@suse.com>
Cc: Oleksandr Natalenko <oleksandr@redhat.com>
Cc: Sandeep Patil <sspatil@google.com>
Cc: SeongJae Park <sj38.park@gmail.com>
Cc: SeongJae Park <sjpark@amazon.de>
Cc: Shakeel Butt <shakeelb@google.com>
Cc: Sonny Rao <sonnyrao@google.com>
Cc: Tim Murray <timmurray@google.com>
Cc: Christian Brauner <christian.brauner@ubuntu.com>
Cc: Florian Weimer <fw@deneb.enyo.de>
Cc: <linux-man@vger.kernel.org>
Link: http://lkml.kernel.org/r/20200302193630.68771-3-minchan@kernel.org
Link: http://lkml.kernel.org/r/20200508183320.GA125527@google.com
Link: http://lkml.kernel.org/r/20200622192900.22757-4-minchan@kernel.org
Link: https://lkml.kernel.org/r/20200901000633.1920247-4-minchan@kernel.org
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2020-10-17 23:14:59 +00:00
|
|
|
440 common process_madvise sys_process_madvise sys_process_madvise
|
2020-12-20 09:58:30 +00:00
|
|
|
441 common epoll_pwait2 sys_epoll_pwait2 compat_sys_epoll_pwait2
|
fs: add mount_setattr()
This implements the missing mount_setattr() syscall. While the new mount
api allows to change the properties of a superblock there is currently
no way to change the properties of a mount or a mount tree using file
descriptors which the new mount api is based on. In addition the old
mount api has the restriction that mount options cannot be applied
recursively. This hasn't changed since changing mount options on a
per-mount basis was implemented in [1] and has been a frequent request
not just for convenience but also for security reasons. The legacy
mount syscall is unable to accommodate this behavior without introducing
a whole new set of flags because MS_REC | MS_REMOUNT | MS_BIND |
MS_RDONLY | MS_NOEXEC | [...] only apply the mount option to the topmost
mount. Changing MS_REC to apply to the whole mount tree would mean
introducing a significant uapi change and would likely cause significant
regressions.
The new mount_setattr() syscall allows to recursively clear and set
mount options in one shot. Multiple calls to change mount options
requesting the same changes are idempotent:
int mount_setattr(int dfd, const char *path, unsigned flags,
struct mount_attr *uattr, size_t usize);
Flags to modify path resolution behavior are specified in the @flags
argument. Currently, AT_EMPTY_PATH, AT_RECURSIVE, AT_SYMLINK_NOFOLLOW,
and AT_NO_AUTOMOUNT are supported. If useful, additional lookup flags to
restrict path resolution as introduced with openat2() might be supported
in the future.
The mount_setattr() syscall can be expected to grow over time and is
designed with extensibility in mind. It follows the extensible syscall
pattern we have used with other syscalls such as openat2(), clone3(),
sched_{set,get}attr(), and others.
The set of mount options is passed in the uapi struct mount_attr which
currently has the following layout:
struct mount_attr {
__u64 attr_set;
__u64 attr_clr;
__u64 propagation;
__u64 userns_fd;
};
The @attr_set and @attr_clr members are used to clear and set mount
options. This way a user can e.g. request that a set of flags is to be
raised such as turning mounts readonly by raising MOUNT_ATTR_RDONLY in
@attr_set while at the same time requesting that another set of flags is
to be lowered such as removing noexec from a mount tree by specifying
MOUNT_ATTR_NOEXEC in @attr_clr.
Note, since the MOUNT_ATTR_<atime> values are an enum starting from 0,
not a bitmap, users wanting to transition to a different atime setting
cannot simply specify the atime setting in @attr_set, but must also
specify MOUNT_ATTR__ATIME in the @attr_clr field. So we ensure that
MOUNT_ATTR__ATIME can't be partially set in @attr_clr and that @attr_set
can't have any atime bits set if MOUNT_ATTR__ATIME isn't set in
@attr_clr.
The @propagation field lets callers specify the propagation type of a
mount tree. Propagation is a single property that has four different
settings and as such is not really a flag argument but an enum.
Specifically, it would be unclear what setting and clearing propagation
settings in combination would amount to. The legacy mount() syscall thus
forbids the combination of multiple propagation settings too. The goal
is to keep the semantics of mount propagation somewhat simple as they
are overly complex as it is.
The @userns_fd field lets users specify a user namespace whose idmapping
becomes the idmapping of the mount. This is implemented and explained in
detail in the next patch.
[1]: commit 2e4b7fcd9260 ("[PATCH] r/o bind mounts: honor mount writer counts at remount")
Link: https://lore.kernel.org/r/20210121131959.646623-35-christian.brauner@ubuntu.com
Cc: David Howells <dhowells@redhat.com>
Cc: Aleksa Sarai <cyphar@cyphar.com>
Cc: Al Viro <viro@zeniv.linux.org.uk>
Cc: linux-fsdevel@vger.kernel.org
Cc: linux-api@vger.kernel.org
Reviewed-by: Christoph Hellwig <hch@lst.de>
Signed-off-by: Christian Brauner <christian.brauner@ubuntu.com>
2021-01-21 13:19:53 +00:00
|
|
|
442 common mount_setattr sys_mount_setattr sys_mount_setattr
|
2021-05-31 16:42:58 +00:00
|
|
|
443 common quotactl_fd sys_quotactl_fd sys_quotactl_fd
|
2021-04-22 15:41:19 +00:00
|
|
|
444 common landlock_create_ruleset sys_landlock_create_ruleset sys_landlock_create_ruleset
|
|
|
|
445 common landlock_add_rule sys_landlock_add_rule sys_landlock_add_rule
|
|
|
|
446 common landlock_restrict_self sys_landlock_restrict_self sys_landlock_restrict_self
|
2023-04-14 12:30:45 +00:00
|
|
|
447 common memfd_secret sys_memfd_secret sys_memfd_secret
|
2021-09-02 22:00:33 +00:00
|
|
|
448 common process_mrelease sys_process_mrelease sys_process_mrelease
|
2021-11-01 13:38:18 +00:00
|
|
|
449 common futex_waitv sys_futex_waitv sys_futex_waitv
|
2022-01-14 22:08:21 +00:00
|
|
|
450 common set_mempolicy_home_node sys_set_mempolicy_home_node sys_set_mempolicy_home_node
|
2023-05-10 19:58:06 +00:00
|
|
|
451 common cachestat sys_cachestat sys_cachestat
|
2023-07-11 16:16:05 +00:00
|
|
|
452 common fchmodat2 sys_fchmodat2 sys_fchmodat2
|
2023-09-14 18:58:03 +00:00
|
|
|
453 common map_shadow_stack sys_map_shadow_stack sys_map_shadow_stack
|
2023-09-21 10:45:10 +00:00
|
|
|
454 common futex_wake sys_futex_wake sys_futex_wake
|
2023-09-21 10:45:12 +00:00
|
|
|
455 common futex_wait sys_futex_wait sys_futex_wait
|
2023-11-02 01:28:33 +00:00
|
|
|
456 common futex_requeue sys_futex_requeue sys_futex_requeue
|
2023-10-25 14:02:04 +00:00
|
|
|
457 common statmount sys_statmount sys_statmount
|
|
|
|
458 common listmount sys_listmount sys_listmount
|
lsm/stable-6.8 PR 20240105
-----BEGIN PGP SIGNATURE-----
iQJIBAABCAAyFiEES0KozwfymdVUl37v6iDy2pc3iXMFAmWYKUIUHHBhdWxAcGF1
bC1tb29yZS5jb20ACgkQ6iDy2pc3iXNyHw/+IKnqL1MZ5QS+/HtSzi4jCL47N9yZ
OHLol6XswyEGHH9myKPPGnT5lVA93v98v4ty2mws7EJUSGZQQUntYBPbU9Gi40+B
XDzYSRocoj96sdlKeOJMgaWo3NBRD9HYSoGPDNWZixy6m+bLPk/Dqhn3FabKf1lo
2qQSmstvChFRmVNkmgaQnBCAtWVqla4EJEL0EKX6cspHbuzRNTeJdTPn6Q/zOUVL
O2znOZuEtSVpYS7yg3uJT0hHD8H0GnIciAcDAhyPSBL5Uk5l6gwJiACcdRfLRbgp
QM5Z4qUFdKljV5XBCzYnfhhrx1df08h1SG84El8UK8HgTTfOZfYmawByJRWNJSQE
TdCmtyyvEbfb61CKBFVwD7Tzb9/y8WgcY5N3Un8uCQqRzFIO+6cghHri5NrVhifp
nPFlP4klxLHh3d7ZVekLmCMHbpaacRyJKwLy+f/nwbBEID47jpPkvZFIpbalat+r
QaKRBNWdTeV+GZ+Yu0uWsI029aQnpcO1kAnGg09fl6b/dsmxeKOVWebir25AzQ++
a702S8HRmj80X+VnXHU9a64XeGtBH7Nq0vu0lGHQPgwhSx/9P6/qICEPwsIriRjR
I9OulWt4OBPDtlsonHFgDs+lbnd0Z0GJUwYT8e9pjRDMxijVO9lhAXyglVRmuNR8
to2ByKP5BO+Vh8Y=
=Py+n
-----END PGP SIGNATURE-----
Merge tag 'lsm-pr-20240105' of git://git.kernel.org/pub/scm/linux/kernel/git/pcmoore/lsm
Pull security module updates from Paul Moore:
- Add three new syscalls: lsm_list_modules(), lsm_get_self_attr(), and
lsm_set_self_attr().
The first syscall simply lists the LSMs enabled, while the second and
third get and set the current process' LSM attributes. Yes, these
syscalls may provide similar functionality to what can be found under
/proc or /sys, but they were designed to support multiple,
simultaneous (stacked) LSMs from the start as opposed to the current
/proc based solutions which were created at a time when only one LSM
was allowed to be active at a given time.
We have spent considerable time discussing ways to extend the
existing /proc interfaces to support multiple, simultaneous LSMs and
even our best ideas have been far too ugly to support as a kernel
API; after +20 years in the kernel, I felt the LSM layer had
established itself enough to justify a handful of syscalls.
Support amongst the individual LSM developers has been nearly
unanimous, with a single objection coming from Tetsuo (TOMOYO) as he
is worried that the LSM_ID_XXX token concept will make it more
difficult for out-of-tree LSMs to survive. Several members of the LSM
community have demonstrated the ability for out-of-tree LSMs to
continue to exist by picking high/unused LSM_ID values as well as
pointing out that many kernel APIs rely on integer identifiers, e.g.
syscalls (!), but unfortunately Tetsuo's objections remain.
My personal opinion is that while I have no interest in penalizing
out-of-tree LSMs, I'm not going to penalize in-tree development to
support out-of-tree development, and I view this as a necessary step
forward to support the push for expanded LSM stacking and reduce our
reliance on /proc and /sys which has occasionally been problematic
for some container users. Finally, we have included the linux-api
folks on (all?) recent revisions of the patchset and addressed all of
their concerns.
- Add a new security_file_ioctl_compat() LSM hook to handle the 32-bit
ioctls on 64-bit systems problem.
This patch includes support for all of the existing LSMs which
provide ioctl hooks, although it turns out only SELinux actually
cares about the individual ioctls. It is worth noting that while
Casey (Smack) and Tetsuo (TOMOYO) did not give explicit ACKs to this
patch, they did both indicate they are okay with the changes.
- Fix a potential memory leak in the CALIPSO code when IPv6 is disabled
at boot.
While it's good that we are fixing this, I doubt this is something
users are seeing in the wild as you need to both disable IPv6 and
then attempt to configure IPv6 labeled networking via
NetLabel/CALIPSO; that just doesn't make much sense.
Normally this would go through netdev, but Jakub asked me to take
this patch and of all the trees I maintain, the LSM tree seemed like
the best fit.
- Update the LSM MAINTAINERS entry with additional information about
our process docs, patchwork, bug reporting, etc.
I also noticed that the Lockdown LSM is missing a dedicated
MAINTAINERS entry so I've added that to the pull request. I've been
working with one of the major Lockdown authors/contributors to see if
they are willing to step up and assume a Lockdown maintainer role;
hopefully that will happen soon, but in the meantime I'll continue to
look after it.
- Add a handful of mailmap entries for Serge Hallyn and myself.
* tag 'lsm-pr-20240105' of git://git.kernel.org/pub/scm/linux/kernel/git/pcmoore/lsm: (27 commits)
lsm: new security_file_ioctl_compat() hook
lsm: Add a __counted_by() annotation to lsm_ctx.ctx
calipso: fix memory leak in netlbl_calipso_add_pass()
selftests: remove the LSM_ID_IMA check in lsm/lsm_list_modules_test
MAINTAINERS: add an entry for the lockdown LSM
MAINTAINERS: update the LSM entry
mailmap: add entries for Serge Hallyn's dead accounts
mailmap: update/replace my old email addresses
lsm: mark the lsm_id variables are marked as static
lsm: convert security_setselfattr() to use memdup_user()
lsm: align based on pointer length in lsm_fill_user_ctx()
lsm: consolidate buffer size handling into lsm_fill_user_ctx()
lsm: correct error codes in security_getselfattr()
lsm: cleanup the size counters in security_getselfattr()
lsm: don't yet account for IMA in LSM_CONFIG_COUNT calculation
lsm: drop LSM_ID_IMA
LSM: selftests for Linux Security Module syscalls
SELinux: Add selfattr hooks
AppArmor: Add selfattr hooks
Smack: implement setselfattr and getselfattr hooks
...
2024-01-09 20:57:46 +00:00
|
|
|
459 common lsm_get_self_attr sys_lsm_get_self_attr sys_lsm_get_self_attr
|
|
|
|
460 common lsm_set_self_attr sys_lsm_set_self_attr sys_lsm_set_self_attr
|
|
|
|
461 common lsm_list_modules sys_lsm_list_modules sys_lsm_list_modules
|