/*
 *	linux/mm/mlock.c
 *
 *  (C) Copyright 1995 Linus Torvalds
 *  (C) Copyright 2002 Christoph Hellwig
 */

#include <linux/capability.h>
#include <linux/mman.h>
#include <linux/mm.h>
#include <linux/mempolicy.h>
#include <linux/syscalls.h>
#include <linux/sched.h>
#include <linux/module.h>
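
/*
 * Added comment, not part of the original file: mlock is permitted either
 * with CAP_IPC_LOCK or with a non-zero RLIMIT_MEMLOCK soft limit; the
 * actual byte limit is enforced by the syscall entry points below.
 */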

int can_do_mlock(void)
{
	if (capable(CAP_IPC_LOCK))
		return 1;
	if (current->signal->rlim[RLIMIT_MEMLOCK].rlim_cur != 0)
		return 1;
	return 0;
}
EXPORT_SYMBOL(can_do_mlock);

static int mlock_fixup(struct vm_area_struct *vma, struct vm_area_struct **prev,
	unsigned long start, unsigned long end, unsigned int newflags)
{
	struct mm_struct * mm = vma->vm_mm;
	pgoff_t pgoff;
	int pages;
	int ret = 0;

	if (newflags == vma->vm_flags) {
		*prev = vma;
		goto out;
	}

	pgoff = vma->vm_pgoff + ((start - vma->vm_start) >> PAGE_SHIFT);
	*prev = vma_merge(mm, *prev, start, end, newflags, vma->anon_vma,
			  vma->vm_file, pgoff, vma_policy(vma));
	if (*prev) {
		vma = *prev;
		goto success;
	}

	*prev = vma;

	if (start != vma->vm_start) {
		ret = split_vma(mm, vma, start, 1);
		if (ret)
			goto out;
	}

	if (end != vma->vm_end) {
		ret = split_vma(mm, vma, end, 0);
		if (ret)
			goto out;
	}

success:
	/*
	 * vm_flags is protected by the mmap_sem held in write mode.
	 * It's okay if try_to_unmap_one unmaps a page just after we
	 * set VM_LOCKED, make_pages_present below will bring it back.
	 */
	vma->vm_flags = newflags;

	/*
	 * Keep track of amount of locked VM.
	 */
	pages = (end - start) >> PAGE_SHIFT;
	if (newflags & VM_LOCKED) {
		pages = -pages;
		if (!(newflags & VM_IO))
			ret = make_pages_present(start, end);
	}

	mm->locked_vm -= pages;
out:
	if (ret == -ENOMEM)
		ret = -EAGAIN;
	return ret;
}
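
/*
 * Worked example of the accounting above (illustrative comment, not part
 * of the original file; assumes 4KiB pages): locking a 16KiB range gives
 * pages = 4, the VM_LOCKED branch negates it to -4, so locked_vm -= pages
 * raises locked_vm by 4; the munlock path keeps pages positive and lowers
 * locked_vm by the same amount.
 */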

static int do_mlock(unsigned long start, size_t len, int on)
{
	unsigned long nstart, end, tmp;
	struct vm_area_struct * vma, * prev;
	int error;

	len = PAGE_ALIGN(len);
	end = start + len;
	if (end < start)
		return -EINVAL;
	if (end == start)
		return 0;
	vma = find_vma_prev(current->mm, start, &prev);
	if (!vma || vma->vm_start > start)
		return -ENOMEM;

	if (start > vma->vm_start)
		prev = vma;

	for (nstart = start ; ; ) {
		unsigned int newflags;

		/* Here we know that  vma->vm_start <= nstart < vma->vm_end. */

		newflags = vma->vm_flags | VM_LOCKED;
		if (!on)
			newflags &= ~VM_LOCKED;

		tmp = vma->vm_end;
		if (tmp > end)
			tmp = end;
		error = mlock_fixup(vma, &prev, nstart, tmp, newflags);
		if (error)
			break;
		nstart = tmp;
		if (nstart < prev->vm_end)
			nstart = prev->vm_end;
		if (nstart >= end)
			break;

		vma = prev->vm_next;
		if (!vma || vma->vm_start != nstart) {
			error = -ENOMEM;
			break;
		}
	}
	return error;
}
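
/*
 * Added comment, not part of the original file: the loop above walks the
 * VMAs covering [start, end) one at a time, clamping each chunk to the
 * current vma via tmp, and bails out with -ENOMEM when it finds a hole,
 * so the whole range must be mapped for mlock/munlock to succeed.
 */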

asmlinkage long sys_mlock(unsigned long start, size_t len)
{
	unsigned long locked;
	unsigned long lock_limit;
	int error = -ENOMEM;

	if (!can_do_mlock())
		return -EPERM;

	down_write(&current->mm->mmap_sem);
	len = PAGE_ALIGN(len + (start & ~PAGE_MASK));
	start &= PAGE_MASK;

	locked = len >> PAGE_SHIFT;
	locked += current->mm->locked_vm;

	lock_limit = current->signal->rlim[RLIMIT_MEMLOCK].rlim_cur;
	lock_limit >>= PAGE_SHIFT;

	/* check against resource limits */
	if ((locked <= lock_limit) || capable(CAP_IPC_LOCK))
		error = do_mlock(start, len, 1);
	up_write(&current->mm->mmap_sem);
	return error;
}
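
/*
 * Worked example of the rounding above (illustrative comment, not part of
 * the original file; assumes 4KiB pages): for start = 0x12345, len = 0x100,
 * start & ~PAGE_MASK is 0x345, so len becomes PAGE_ALIGN(0x445) = 0x1000
 * and start is rounded down to 0x12000; the single page containing the
 * request is what gets locked and charged against RLIMIT_MEMLOCK.
 */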

asmlinkage long sys_munlock(unsigned long start, size_t len)
{
	int ret;

	down_write(&current->mm->mmap_sem);
	len = PAGE_ALIGN(len + (start & ~PAGE_MASK));
	start &= PAGE_MASK;
	ret = do_mlock(start, len, 0);
	up_write(&current->mm->mmap_sem);
	return ret;
}

static int do_mlockall(int flags)
{
	struct vm_area_struct * vma, * prev = NULL;
	unsigned int def_flags = 0;

	if (flags & MCL_FUTURE)
		def_flags = VM_LOCKED;
	current->mm->def_flags = def_flags;
	if (flags == MCL_FUTURE)
		goto out;

	for (vma = current->mm->mmap; vma ; vma = prev->vm_next) {
		unsigned int newflags;

		newflags = vma->vm_flags | VM_LOCKED;
		if (!(flags & MCL_CURRENT))
			newflags &= ~VM_LOCKED;

		/* Ignore errors */
		mlock_fixup(vma, &prev, vma->vm_start, vma->vm_end, newflags);
	}
out:
	return 0;
}
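
/*
 * Added comment, not part of the original file: MCL_FUTURE only sets
 * mm->def_flags so that future mappings are created VM_LOCKED, while
 * MCL_CURRENT walks the existing VMAs; passing MCL_FUTURE alone skips the
 * walk entirely, and flags == 0 (from sys_munlockall) clears both.
 */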

asmlinkage long sys_mlockall(int flags)
{
	unsigned long lock_limit;
	int ret = -EINVAL;

	if (!flags || (flags & ~(MCL_CURRENT | MCL_FUTURE)))
		goto out;

	ret = -EPERM;
	if (!can_do_mlock())
		goto out;

	down_write(&current->mm->mmap_sem);

	lock_limit = current->signal->rlim[RLIMIT_MEMLOCK].rlim_cur;
	lock_limit >>= PAGE_SHIFT;

	ret = -ENOMEM;
	if (!(flags & MCL_CURRENT) || (current->mm->total_vm <= lock_limit) ||
	    capable(CAP_IPC_LOCK))
		ret = do_mlockall(flags);
	up_write(&current->mm->mmap_sem);
out:
	return ret;
}

asmlinkage long sys_munlockall(void)
{
	int ret;

	down_write(&current->mm->mmap_sem);
	ret = do_mlockall(0);
	up_write(&current->mm->mmap_sem);
	return ret;
}

/*
 * Objects with different lifetime than processes (SHM_LOCK and SHM_HUGETLB
 * shm segments) get accounted against the user_struct instead.
 */
static DEFINE_SPINLOCK(shmlock_user_lock);

int user_shm_lock(size_t size, struct user_struct *user)
{
	unsigned long lock_limit, locked;
	int allowed = 0;

	locked = (size + PAGE_SIZE - 1) >> PAGE_SHIFT;
	lock_limit = current->signal->rlim[RLIMIT_MEMLOCK].rlim_cur;
	lock_limit >>= PAGE_SHIFT;
	spin_lock(&shmlock_user_lock);
	if (locked + user->locked_shm > lock_limit && !capable(CAP_IPC_LOCK))
		goto out;
	get_uid(user);
	user->locked_shm += locked;
	allowed = 1;
out:
	spin_unlock(&shmlock_user_lock);
	return allowed;
}
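
/*
 * Added comment, not part of the original file: (size + PAGE_SIZE - 1) >>
 * PAGE_SHIFT rounds the segment size up to whole pages, e.g. a 5000 byte
 * SHM_LOCK request with 4KiB pages charges 2 pages to user->locked_shm,
 * and user_shm_unlock below undoes exactly the same charge.
 */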

void user_shm_unlock(size_t size, struct user_struct *user)
{
	spin_lock(&shmlock_user_lock);
	user->locked_shm -= (size + PAGE_SIZE - 1) >> PAGE_SHIFT;
	spin_unlock(&shmlock_user_lock);
	free_uid(user);
}