14280637e9b86cbe1415932c45aa32abef047716
[linux-2.6.git] / mm / mlock.c
1 /*
2  *      linux/mm/mlock.c
3  *
4  *  (C) Copyright 1995 Linus Torvalds
5  *  (C) Copyright 2002 Christoph Hellwig
6  */
7
8 #include <linux/mman.h>
9 #include <linux/mm.h>
10
11
12 static int mlock_fixup(struct vm_area_struct * vma, 
13         unsigned long start, unsigned long end, unsigned int newflags)
14 {
15         struct mm_struct * mm = vma->vm_mm;
16         int pages;
17         int ret = 0;
18
19         if (newflags == vma->vm_flags)
20                 goto out;
21
22         if (start != vma->vm_start) {
23                 if (split_vma(mm, vma, start, 1)) {
24                         ret = -EAGAIN;
25                         goto out;
26                 }
27         }
28
29         if (end != vma->vm_end) {
30                 if (split_vma(mm, vma, end, 0)) {
31                         ret = -EAGAIN;
32                         goto out;
33                 }
34         }
35
36         /*
37          * vm_flags is protected by the mmap_sem held in write mode.
38          * It's okay if try_to_unmap_one unmaps a page just after we
39          * set VM_LOCKED, make_pages_present below will bring it back.
40          */
41         vma->vm_flags = newflags;
42
43         /*
44          * Keep track of amount of locked VM.
45          */
46         pages = (end - start) >> PAGE_SHIFT;
47         if (newflags & VM_LOCKED) {
48                 pages = -pages;
49                 ret = make_pages_present(start, end);
50         }
51
52         vma->vm_mm->locked_vm -= pages;
53 out:
54         return ret;
55 }
56
57 static int do_mlock(unsigned long start, size_t len, int on)
58 {
59         unsigned long nstart, end, tmp;
60         struct vm_area_struct * vma, * next;
61         int error;
62
63         if (on && !can_do_mlock())
64                 return -EPERM;
65         len = PAGE_ALIGN(len);
66         end = start + len;
67         if (end < start)
68                 return -EINVAL;
69         if (end == start)
70                 return 0;
71         vma = find_vma(current->mm, start);
72         if (!vma || vma->vm_start > start)
73                 return -ENOMEM;
74
75         for (nstart = start ; ; ) {
76                 unsigned int newflags;
77
78                 /* Here we know that  vma->vm_start <= nstart < vma->vm_end. */
79
80                 newflags = vma->vm_flags | VM_LOCKED;
81                 if (!on)
82                         newflags &= ~VM_LOCKED;
83
84                 if (vma->vm_end >= end) {
85                         error = mlock_fixup(vma, nstart, end, newflags);
86                         break;
87                 }
88
89                 tmp = vma->vm_end;
90                 next = vma->vm_next;
91                 error = mlock_fixup(vma, nstart, tmp, newflags);
92                 if (error)
93                         break;
94                 nstart = tmp;
95                 vma = next;
96                 if (!vma || vma->vm_start != nstart) {
97                         error = -ENOMEM;
98                         break;
99                 }
100         }
101         return error;
102 }
103
104 asmlinkage long sys_mlock(unsigned long start, size_t len)
105 {
106         unsigned long locked, grow;
107         unsigned long lock_limit;
108         int error = -ENOMEM;
109
110         down_write(&current->mm->mmap_sem);
111         len = PAGE_ALIGN(len + (start & ~PAGE_MASK));
112         start &= PAGE_MASK;
113
114         grow = len >> PAGE_SHIFT;
115         if (!vx_vmlocked_avail(current->mm, grow))
116                 goto out;
117         locked = current->mm->locked_vm + grow;
118
119         lock_limit = current->rlim[RLIMIT_MEMLOCK].rlim_cur;
120         lock_limit >>= PAGE_SHIFT;
121
122         /* check against resource limits */
123         if ( (locked <= lock_limit) || capable(CAP_IPC_LOCK))
124                 error = do_mlock(start, len, 1);
125 out:
126         up_write(&current->mm->mmap_sem);
127         return error;
128 }
129
130 asmlinkage long sys_munlock(unsigned long start, size_t len)
131 {
132         int ret;
133
134         down_write(&current->mm->mmap_sem);
135         len = PAGE_ALIGN(len + (start & ~PAGE_MASK));
136         start &= PAGE_MASK;
137         ret = do_mlock(start, len, 0);
138         up_write(&current->mm->mmap_sem);
139         return ret;
140 }
141
142 static int do_mlockall(int flags)
143 {
144         int error;
145         unsigned int def_flags;
146         struct vm_area_struct * vma;
147
148         if (!can_do_mlock())
149                 return -EPERM;
150
151         def_flags = 0;
152         if (flags & MCL_FUTURE)
153                 def_flags = VM_LOCKED;
154         current->mm->def_flags = def_flags;
155
156         error = 0;
157         for (vma = current->mm->mmap; vma ; vma = vma->vm_next) {
158                 unsigned int newflags;
159
160                 newflags = vma->vm_flags | VM_LOCKED;
161                 if (!(flags & MCL_CURRENT))
162                         newflags &= ~VM_LOCKED;
163
164                 /* Ignore errors */
165                 mlock_fixup(vma, vma->vm_start, vma->vm_end, newflags);
166         }
167         return error;
168 }
169
170 asmlinkage long sys_mlockall(int flags)
171 {
172         unsigned long lock_limit;
173         int ret = -EINVAL;
174
175         down_write(&current->mm->mmap_sem);
176         if (!flags || (flags & ~(MCL_CURRENT | MCL_FUTURE)))
177                 goto out;
178
179         lock_limit = current->rlim[RLIMIT_MEMLOCK].rlim_cur;
180         lock_limit >>= PAGE_SHIFT;
181
182         ret = -ENOMEM;
183         if (!vx_vmlocked_avail(current->mm, current->mm->total_vm))
184                 goto out;
185         /* check vserver lock limits? */
186         if ((current->mm->total_vm <= lock_limit) || capable(CAP_IPC_LOCK))
187                 ret = do_mlockall(flags);
188 out:
189         up_write(&current->mm->mmap_sem);
190         return ret;
191 }
192
193 asmlinkage long sys_munlockall(void)
194 {
195         int ret;
196
197         down_write(&current->mm->mmap_sem);
198         ret = do_mlockall(0);
199         up_write(&current->mm->mmap_sem);
200         return ret;
201 }