aboutsummaryrefslogtreecommitdiffstats
path: root/arch/x86/xen/p2m.c
diff options
context:
space:
mode:
authorJeremy Fitzhardinge <jeremy.fitzhardinge@citrix.com>2010-12-06 19:29:22 -0500
committerKonrad Rzeszutek Wilk <konrad.wilk@oracle.com>2011-01-11 14:31:07 -0500
commitb5eafe924bb054d7c56e6ebd18106352e8a3f916 (patch)
treeb7e88c3259df6f5a57d7b04225a053ac435c1a9d /arch/x86/xen/p2m.c
parent8d3eaea24609c7cd6fb0e6471f46a52f9e5d0202 (diff)
xen: move p2m handling to separate file
Signed-off-by: Jeremy Fitzhardinge <jeremy.fitzhardinge@citrix.com> Signed-off-by: Konrad Rzeszutek Wilk <konrad.wilk@oracle.com>
Diffstat (limited to 'arch/x86/xen/p2m.c')
-rw-r--r--arch/x86/xen/p2m.c376
1 files changed, 376 insertions, 0 deletions
diff --git a/arch/x86/xen/p2m.c b/arch/x86/xen/p2m.c
new file mode 100644
index 000000000000..259ec3bb8b6f
--- /dev/null
+++ b/arch/x86/xen/p2m.c
@@ -0,0 +1,376 @@
1/*
2 * Xen leaves the responsibility for maintaining p2m mappings to the
3 * guests themselves, but it must also access and update the p2m array
4 * during suspend/resume when all the pages are reallocated.
5 *
6 * The p2m table is logically a flat array, but we implement it as a
7 * three-level tree to allow the address space to be sparse.
8 *
9 * Xen
10 * |
11 * p2m_top p2m_top_mfn
12 * / \ / \
13 * p2m_mid p2m_mid p2m_mid_mfn p2m_mid_mfn
14 * / \ / \ / /
15 * p2m p2m p2m p2m p2m p2m p2m ...
16 *
17 * The p2m_mid_mfn pages are mapped by p2m_top_mfn_p.
18 *
19 * The p2m_top and p2m_top_mfn levels are limited to 1 page, so the
20 * maximum representable pseudo-physical address space is:
21 * P2M_TOP_PER_PAGE * P2M_MID_PER_PAGE * P2M_PER_PAGE pages
22 *
23 * P2M_PER_PAGE depends on the architecture, as a mfn is always
24 * unsigned long (8 bytes on 64-bit, 4 bytes on 32), leading to
25 * 512 and 1024 entries respectively.
26 */
27
28#include <linux/init.h>
29#include <linux/module.h>
30
31#include <asm/cache.h>
32#include <asm/setup.h>
33
34#include <asm/xen/page.h>
35#include <asm/xen/hypercall.h>
36#include <asm/xen/hypervisor.h>
37
38#include "xen-ops.h"
39
40unsigned long xen_max_p2m_pfn __read_mostly;
41
42#define P2M_PER_PAGE (PAGE_SIZE / sizeof(unsigned long))
43#define P2M_MID_PER_PAGE (PAGE_SIZE / sizeof(unsigned long *))
44#define P2M_TOP_PER_PAGE (PAGE_SIZE / sizeof(unsigned long **))
45
46#define MAX_P2M_PFN (P2M_TOP_PER_PAGE * P2M_MID_PER_PAGE * P2M_PER_PAGE)
47
48/* Placeholders for holes in the address space */
49static RESERVE_BRK_ARRAY(unsigned long, p2m_missing, P2M_PER_PAGE);
50static RESERVE_BRK_ARRAY(unsigned long *, p2m_mid_missing, P2M_MID_PER_PAGE);
51static RESERVE_BRK_ARRAY(unsigned long, p2m_mid_missing_mfn, P2M_MID_PER_PAGE);
52
53static RESERVE_BRK_ARRAY(unsigned long **, p2m_top, P2M_TOP_PER_PAGE);
54static RESERVE_BRK_ARRAY(unsigned long, p2m_top_mfn, P2M_TOP_PER_PAGE);
55static RESERVE_BRK_ARRAY(unsigned long *, p2m_top_mfn_p, P2M_TOP_PER_PAGE);
56
57RESERVE_BRK(p2m_mid, PAGE_SIZE * (MAX_DOMAIN_PAGES / (P2M_PER_PAGE * P2M_MID_PER_PAGE)));
58RESERVE_BRK(p2m_mid_mfn, PAGE_SIZE * (MAX_DOMAIN_PAGES / (P2M_PER_PAGE * P2M_MID_PER_PAGE)));
59
60static inline unsigned p2m_top_index(unsigned long pfn)
61{
62 BUG_ON(pfn >= MAX_P2M_PFN);
63 return pfn / (P2M_MID_PER_PAGE * P2M_PER_PAGE);
64}
65
66static inline unsigned p2m_mid_index(unsigned long pfn)
67{
68 return (pfn / P2M_PER_PAGE) % P2M_MID_PER_PAGE;
69}
70
71static inline unsigned p2m_index(unsigned long pfn)
72{
73 return pfn % P2M_PER_PAGE;
74}
75
76static void p2m_top_init(unsigned long ***top)
77{
78 unsigned i;
79
80 for (i = 0; i < P2M_TOP_PER_PAGE; i++)
81 top[i] = p2m_mid_missing;
82}
83
84static void p2m_top_mfn_init(unsigned long *top)
85{
86 unsigned i;
87
88 for (i = 0; i < P2M_TOP_PER_PAGE; i++)
89 top[i] = virt_to_mfn(p2m_mid_missing_mfn);
90}
91
92static void p2m_top_mfn_p_init(unsigned long **top)
93{
94 unsigned i;
95
96 for (i = 0; i < P2M_TOP_PER_PAGE; i++)
97 top[i] = p2m_mid_missing_mfn;
98}
99
100static void p2m_mid_init(unsigned long **mid)
101{
102 unsigned i;
103
104 for (i = 0; i < P2M_MID_PER_PAGE; i++)
105 mid[i] = p2m_missing;
106}
107
108static void p2m_mid_mfn_init(unsigned long *mid)
109{
110 unsigned i;
111
112 for (i = 0; i < P2M_MID_PER_PAGE; i++)
113 mid[i] = virt_to_mfn(p2m_missing);
114}
115
116static void p2m_init(unsigned long *p2m)
117{
118 unsigned i;
119
120 for (i = 0; i < P2M_MID_PER_PAGE; i++)
121 p2m[i] = INVALID_P2M_ENTRY;
122}
123
124/*
125 * Build the parallel p2m_top_mfn and p2m_mid_mfn structures
126 *
127 * This is called both at boot time, and after resuming from suspend:
128 * - At boot time we're called very early, and must use extend_brk()
129 * to allocate memory.
130 *
131 * - After resume we're called from within stop_machine, but the mfn
132 * tree should alreay be completely allocated.
133 */
134void xen_build_mfn_list_list(void)
135{
136 unsigned long pfn;
137
138 /* Pre-initialize p2m_top_mfn to be completely missing */
139 if (p2m_top_mfn == NULL) {
140 p2m_mid_missing_mfn = extend_brk(PAGE_SIZE, PAGE_SIZE);
141 p2m_mid_mfn_init(p2m_mid_missing_mfn);
142
143 p2m_top_mfn_p = extend_brk(PAGE_SIZE, PAGE_SIZE);
144 p2m_top_mfn_p_init(p2m_top_mfn_p);
145
146 p2m_top_mfn = extend_brk(PAGE_SIZE, PAGE_SIZE);
147 p2m_top_mfn_init(p2m_top_mfn);
148 } else {
149 /* Reinitialise, mfn's all change after migration */
150 p2m_mid_mfn_init(p2m_mid_missing_mfn);
151 }
152
153 for (pfn = 0; pfn < xen_max_p2m_pfn; pfn += P2M_PER_PAGE) {
154 unsigned topidx = p2m_top_index(pfn);
155 unsigned mididx = p2m_mid_index(pfn);
156 unsigned long **mid;
157 unsigned long *mid_mfn_p;
158
159 mid = p2m_top[topidx];
160 mid_mfn_p = p2m_top_mfn_p[topidx];
161
162 /* Don't bother allocating any mfn mid levels if
163 * they're just missing, just update the stored mfn,
164 * since all could have changed over a migrate.
165 */
166 if (mid == p2m_mid_missing) {
167 BUG_ON(mididx);
168 BUG_ON(mid_mfn_p != p2m_mid_missing_mfn);
169 p2m_top_mfn[topidx] = virt_to_mfn(p2m_mid_missing_mfn);
170 pfn += (P2M_MID_PER_PAGE - 1) * P2M_PER_PAGE;
171 continue;
172 }
173
174 if (mid_mfn_p == p2m_mid_missing_mfn) {
175 /*
176 * XXX boot-time only! We should never find
177 * missing parts of the mfn tree after
178 * runtime. extend_brk() will BUG if we call
179 * it too late.
180 */
181 mid_mfn_p = extend_brk(PAGE_SIZE, PAGE_SIZE);
182 p2m_mid_mfn_init(mid_mfn_p);
183
184 p2m_top_mfn_p[topidx] = mid_mfn_p;
185 }
186
187 p2m_top_mfn[topidx] = virt_to_mfn(mid_mfn_p);
188 mid_mfn_p[mididx] = virt_to_mfn(mid[mididx]);
189 }
190}
191
192void xen_setup_mfn_list_list(void)
193{
194 BUG_ON(HYPERVISOR_shared_info == &xen_dummy_shared_info);
195
196 HYPERVISOR_shared_info->arch.pfn_to_mfn_frame_list_list =
197 virt_to_mfn(p2m_top_mfn);
198 HYPERVISOR_shared_info->arch.max_pfn = xen_max_p2m_pfn;
199}
200
201/* Set up p2m_top to point to the domain-builder provided p2m pages */
202void __init xen_build_dynamic_phys_to_machine(void)
203{
204 unsigned long *mfn_list = (unsigned long *)xen_start_info->mfn_list;
205 unsigned long max_pfn = min(MAX_DOMAIN_PAGES, xen_start_info->nr_pages);
206 unsigned long pfn;
207
208 xen_max_p2m_pfn = max_pfn;
209
210 p2m_missing = extend_brk(PAGE_SIZE, PAGE_SIZE);
211 p2m_init(p2m_missing);
212
213 p2m_mid_missing = extend_brk(PAGE_SIZE, PAGE_SIZE);
214 p2m_mid_init(p2m_mid_missing);
215
216 p2m_top = extend_brk(PAGE_SIZE, PAGE_SIZE);
217 p2m_top_init(p2m_top);
218
219 /*
220 * The domain builder gives us a pre-constructed p2m array in
221 * mfn_list for all the pages initially given to us, so we just
222 * need to graft that into our tree structure.
223 */
224 for (pfn = 0; pfn < max_pfn; pfn += P2M_PER_PAGE) {
225 unsigned topidx = p2m_top_index(pfn);
226 unsigned mididx = p2m_mid_index(pfn);
227
228 if (p2m_top[topidx] == p2m_mid_missing) {
229 unsigned long **mid = extend_brk(PAGE_SIZE, PAGE_SIZE);
230 p2m_mid_init(mid);
231
232 p2m_top[topidx] = mid;
233 }
234
235 p2m_top[topidx][mididx] = &mfn_list[pfn];
236 }
237}
238
239unsigned long get_phys_to_machine(unsigned long pfn)
240{
241 unsigned topidx, mididx, idx;
242
243 if (unlikely(pfn >= MAX_P2M_PFN))
244 return INVALID_P2M_ENTRY;
245
246 topidx = p2m_top_index(pfn);
247 mididx = p2m_mid_index(pfn);
248 idx = p2m_index(pfn);
249
250 return p2m_top[topidx][mididx][idx];
251}
252EXPORT_SYMBOL_GPL(get_phys_to_machine);
253
254static void *alloc_p2m_page(void)
255{
256 return (void *)__get_free_page(GFP_KERNEL | __GFP_REPEAT);
257}
258
259static void free_p2m_page(void *p)
260{
261 free_page((unsigned long)p);
262}
263
264/*
265 * Fully allocate the p2m structure for a given pfn. We need to check
266 * that both the top and mid levels are allocated, and make sure the
267 * parallel mfn tree is kept in sync. We may race with other cpus, so
268 * the new pages are installed with cmpxchg; if we lose the race then
269 * simply free the page we allocated and use the one that's there.
270 */
271static bool alloc_p2m(unsigned long pfn)
272{
273 unsigned topidx, mididx;
274 unsigned long ***top_p, **mid;
275 unsigned long *top_mfn_p, *mid_mfn;
276
277 topidx = p2m_top_index(pfn);
278 mididx = p2m_mid_index(pfn);
279
280 top_p = &p2m_top[topidx];
281 mid = *top_p;
282
283 if (mid == p2m_mid_missing) {
284 /* Mid level is missing, allocate a new one */
285 mid = alloc_p2m_page();
286 if (!mid)
287 return false;
288
289 p2m_mid_init(mid);
290
291 if (cmpxchg(top_p, p2m_mid_missing, mid) != p2m_mid_missing)
292 free_p2m_page(mid);
293 }
294
295 top_mfn_p = &p2m_top_mfn[topidx];
296 mid_mfn = p2m_top_mfn_p[topidx];
297
298 BUG_ON(virt_to_mfn(mid_mfn) != *top_mfn_p);
299
300 if (mid_mfn == p2m_mid_missing_mfn) {
301 /* Separately check the mid mfn level */
302 unsigned long missing_mfn;
303 unsigned long mid_mfn_mfn;
304
305 mid_mfn = alloc_p2m_page();
306 if (!mid_mfn)
307 return false;
308
309 p2m_mid_mfn_init(mid_mfn);
310
311 missing_mfn = virt_to_mfn(p2m_mid_missing_mfn);
312 mid_mfn_mfn = virt_to_mfn(mid_mfn);
313 if (cmpxchg(top_mfn_p, missing_mfn, mid_mfn_mfn) != missing_mfn)
314 free_p2m_page(mid_mfn);
315 else
316 p2m_top_mfn_p[topidx] = mid_mfn;
317 }
318
319 if (p2m_top[topidx][mididx] == p2m_missing) {
320 /* p2m leaf page is missing */
321 unsigned long *p2m;
322
323 p2m = alloc_p2m_page();
324 if (!p2m)
325 return false;
326
327 p2m_init(p2m);
328
329 if (cmpxchg(&mid[mididx], p2m_missing, p2m) != p2m_missing)
330 free_p2m_page(p2m);
331 else
332 mid_mfn[mididx] = virt_to_mfn(p2m);
333 }
334
335 return true;
336}
337
338/* Try to install p2m mapping; fail if intermediate bits missing */
339bool __set_phys_to_machine(unsigned long pfn, unsigned long mfn)
340{
341 unsigned topidx, mididx, idx;
342
343 if (unlikely(pfn >= MAX_P2M_PFN)) {
344 BUG_ON(mfn != INVALID_P2M_ENTRY);
345 return true;
346 }
347
348 topidx = p2m_top_index(pfn);
349 mididx = p2m_mid_index(pfn);
350 idx = p2m_index(pfn);
351
352 if (p2m_top[topidx][mididx] == p2m_missing)
353 return mfn == INVALID_P2M_ENTRY;
354
355 p2m_top[topidx][mididx][idx] = mfn;
356
357 return true;
358}
359
360bool set_phys_to_machine(unsigned long pfn, unsigned long mfn)
361{
362 if (unlikely(xen_feature(XENFEAT_auto_translated_physmap))) {
363 BUG_ON(pfn != mfn && mfn != INVALID_P2M_ENTRY);
364 return true;
365 }
366
367 if (unlikely(!__set_phys_to_machine(pfn, mfn))) {
368 if (!alloc_p2m(pfn))
369 return false;
370
371 if (!__set_phys_to_machine(pfn, mfn))
372 return false;
373 }
374
375 return true;
376}