1 // SPDX-License-Identifier: GPL-2.0
2 #include <linux/kernel.h>
3 #include <linux/errno.h>
4 #include <linux/err.h>
5 #include <linux/mm.h>
6 #include <linux/slab.h>
7 #include <linux/vmalloc.h>
8 #include <linux/pagemap.h>
9 #include <linux/sched.h>
10
11 /**
12 * get_vaddr_frames() - map virtual addresses to pfns
13 * @start: starting user address
14 * @nr_frames: number of pages / pfns from start to map
15 * @gup_flags: flags modifying lookup behaviour
16 * @vec: structure which receives pages / pfns of the addresses mapped.
17 * It should have space for at least nr_frames entries.
18 *
19 * This function maps virtual addresses from @start and fills @vec structure
20 * with page frame numbers or page pointers to corresponding pages (choice
21 * depends on the type of the vma underlying the virtual address). If @start
22 * belongs to a normal vma, the function grabs reference to each of the pages
23 * to pin them in memory. If @start belongs to VM_IO | VM_PFNMAP vma, we don't
24 * touch page structures and the caller must make sure pfns aren't reused for
25 * anything else while he is using them.
26 *
27 * The function returns number of pages mapped which may be less than
28 * @nr_frames. In particular we stop mapping if there are more vmas of
29 * different type underlying the specified range of virtual addresses.
30 * When the function isn't able to map a single page, it returns error.
31 *
32 * This function takes care of grabbing mmap_sem as necessary.
33 */
get_vaddr_frames(unsigned long start,unsigned int nr_frames,unsigned int gup_flags,struct frame_vector * vec)34 int get_vaddr_frames(unsigned long start, unsigned int nr_frames,
35 unsigned int gup_flags, struct frame_vector *vec)
36 {
37 struct mm_struct *mm = current->mm;
38 struct vm_area_struct *vma;
39 int ret = 0;
40 int locked;
41
42 if (nr_frames == 0)
43 return 0;
44
45 if (WARN_ON_ONCE(nr_frames > vec->nr_allocated))
46 nr_frames = vec->nr_allocated;
47
48 start = untagged_addr(start);
49
50 down_read(&mm->mmap_sem);
51 locked = 1;
52 vma = find_vma_intersection(mm, start, start + 1);
53 if (!vma) {
54 ret = -EFAULT;
55 goto out;
56 }
57
58 /*
59 * While get_vaddr_frames() could be used for transient (kernel
60 * controlled lifetime) pinning of memory pages all current
61 * users establish long term (userspace controlled lifetime)
62 * page pinning. Treat get_vaddr_frames() like
63 * get_user_pages_longterm() and disallow it for filesystem-dax
64 * mappings.
65 */
66 if (vma_is_fsdax(vma)) {
67 ret = -EOPNOTSUPP;
68 goto out;
69 }
70
71 if (!(vma->vm_flags & (VM_IO | VM_PFNMAP))) {
72 vec->got_ref = true;
73 vec->is_pfns = false;
74 ret = get_user_pages_locked(start, nr_frames,
75 gup_flags, (struct page **)(vec->ptrs), &locked);
76 if (likely(ret > 0))
77 goto out;
78 }
79
80 /* This used to (racily) return non-refcounted pfns. Let people know */
81 WARN_ONCE(1, "get_vaddr_frames() cannot follow VM_IO mapping");
82 vec->nr_frames = 0;
83
84 out:
85 if (locked)
86 up_read(&mm->mmap_sem);
87 if (!ret)
88 ret = -EFAULT;
89 if (ret > 0)
90 vec->nr_frames = ret;
91 return ret;
92 }
93 EXPORT_SYMBOL(get_vaddr_frames);
94
95 /**
96 * put_vaddr_frames() - drop references to pages if get_vaddr_frames() acquired
97 * them
98 * @vec: frame vector to put
99 *
100 * Drop references to pages if get_vaddr_frames() acquired them. We also
101 * invalidate the frame vector so that it is prepared for the next call into
102 * get_vaddr_frames().
103 */
put_vaddr_frames(struct frame_vector * vec)104 void put_vaddr_frames(struct frame_vector *vec)
105 {
106 int i;
107 struct page **pages;
108
109 if (!vec->got_ref)
110 goto out;
111 pages = frame_vector_pages(vec);
112 /*
113 * frame_vector_pages() might needed to do a conversion when
114 * get_vaddr_frames() got pages but vec was later converted to pfns.
115 * But it shouldn't really fail to convert pfns back...
116 */
117 if (WARN_ON(IS_ERR(pages)))
118 goto out;
119 for (i = 0; i < vec->nr_frames; i++)
120 put_page(pages[i]);
121 vec->got_ref = false;
122 out:
123 vec->nr_frames = 0;
124 }
125 EXPORT_SYMBOL(put_vaddr_frames);
126
127 /**
128 * frame_vector_to_pages - convert frame vector to contain page pointers
129 * @vec: frame vector to convert
130 *
131 * Convert @vec to contain array of page pointers. If the conversion is
132 * successful, return 0. Otherwise return an error. Note that we do not grab
133 * page references for the page structures.
134 */
frame_vector_to_pages(struct frame_vector * vec)135 int frame_vector_to_pages(struct frame_vector *vec)
136 {
137 int i;
138 unsigned long *nums;
139 struct page **pages;
140
141 if (!vec->is_pfns)
142 return 0;
143 nums = frame_vector_pfns(vec);
144 for (i = 0; i < vec->nr_frames; i++)
145 if (!pfn_valid(nums[i]))
146 return -EINVAL;
147 pages = (struct page **)nums;
148 for (i = 0; i < vec->nr_frames; i++)
149 pages[i] = pfn_to_page(nums[i]);
150 vec->is_pfns = false;
151 return 0;
152 }
153 EXPORT_SYMBOL(frame_vector_to_pages);
154
155 /**
156 * frame_vector_to_pfns - convert frame vector to contain pfns
157 * @vec: frame vector to convert
158 *
159 * Convert @vec to contain array of pfns.
160 */
frame_vector_to_pfns(struct frame_vector * vec)161 void frame_vector_to_pfns(struct frame_vector *vec)
162 {
163 int i;
164 unsigned long *nums;
165 struct page **pages;
166
167 if (vec->is_pfns)
168 return;
169 pages = (struct page **)(vec->ptrs);
170 nums = (unsigned long *)pages;
171 for (i = 0; i < vec->nr_frames; i++)
172 nums[i] = page_to_pfn(pages[i]);
173 vec->is_pfns = true;
174 }
175 EXPORT_SYMBOL(frame_vector_to_pfns);
176
177 /**
178 * frame_vector_create() - allocate & initialize structure for pinned pfns
179 * @nr_frames: number of pfns slots we should reserve
180 *
181 * Allocate and initialize struct pinned_pfns to be able to hold @nr_pfns
182 * pfns.
183 */
frame_vector_create(unsigned int nr_frames)184 struct frame_vector *frame_vector_create(unsigned int nr_frames)
185 {
186 struct frame_vector *vec;
187 int size = sizeof(struct frame_vector) + sizeof(void *) * nr_frames;
188
189 if (WARN_ON_ONCE(nr_frames == 0))
190 return NULL;
191 /*
192 * This is absurdly high. It's here just to avoid strange effects when
193 * arithmetics overflows.
194 */
195 if (WARN_ON_ONCE(nr_frames > INT_MAX / sizeof(void *) / 2))
196 return NULL;
197 /*
198 * Avoid higher order allocations, use vmalloc instead. It should
199 * be rare anyway.
200 */
201 vec = kvmalloc(size, GFP_KERNEL);
202 if (!vec)
203 return NULL;
204 vec->nr_allocated = nr_frames;
205 vec->nr_frames = 0;
206 return vec;
207 }
208 EXPORT_SYMBOL(frame_vector_create);
209
210 /**
211 * frame_vector_destroy() - free memory allocated to carry frame vector
212 * @vec: Frame vector to free
213 *
214 * Free structure allocated by frame_vector_create() to carry frames.
215 */
frame_vector_destroy(struct frame_vector * vec)216 void frame_vector_destroy(struct frame_vector *vec)
217 {
218 /* Make sure put_vaddr_frames() got called properly... */
219 VM_BUG_ON(vec->nr_frames > 0);
220 kvfree(vec);
221 }
222 EXPORT_SYMBOL(frame_vector_destroy);
223