]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blame - drivers/xen/grant-table.c
xen/pvh: Fix misplaced kfree from xlated_setup_gnttab_pages
[mirror_ubuntu-artful-kernel.git] / drivers / xen / grant-table.c
CommitLineData
ad9a8612
JF
1/******************************************************************************
2 * grant_table.c
3 *
4 * Granting foreign access to our memory reservation.
5 *
6 * Copyright (c) 2005-2006, Christopher Clark
7 * Copyright (c) 2004-2005, K A Fraser
8 *
9 * This program is free software; you can redistribute it and/or
10 * modify it under the terms of the GNU General Public License version 2
11 * as published by the Free Software Foundation; or, when distributed
12 * separately from the Linux kernel or incorporated into other
13 * software packages, subject to the following license:
14 *
15 * Permission is hereby granted, free of charge, to any person obtaining a copy
16 * of this source file (the "Software"), to deal in the Software without
17 * restriction, including without limitation the rights to use, copy, modify,
18 * merge, publish, distribute, sublicense, and/or sell copies of the Software,
19 * and to permit persons to whom the Software is furnished to do so, subject to
20 * the following conditions:
21 *
22 * The above copyright notice and this permission notice shall be included in
23 * all copies or substantial portions of the Software.
24 *
25 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
26 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
27 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
28 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
29 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
30 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
31 * IN THE SOFTWARE.
32 */
33
283c0972
JP
34#define pr_fmt(fmt) "xen:" KBUILD_MODNAME ": " fmt
35
ad9a8612
JF
36#include <linux/module.h>
37#include <linux/sched.h>
38#include <linux/mm.h>
5a0e3ad6 39#include <linux/slab.h>
ad9a8612
JF
40#include <linux/vmalloc.h>
41#include <linux/uaccess.h>
183d03cc 42#include <linux/io.h>
c571898f 43#include <linux/delay.h>
f62805f1 44#include <linux/hardirq.h>
ad9a8612 45
1ccbf534 46#include <xen/xen.h>
ad9a8612
JF
47#include <xen/interface/xen.h>
48#include <xen/page.h>
49#include <xen/grant_table.h>
183d03cc 50#include <xen/interface/memory.h>
85ff6acb 51#include <xen/hvc-console.h>
3d24bbd7 52#include <xen/swiotlb-xen.h>
ecbf29cd 53#include <asm/xen/hypercall.h>
4d9310e3 54#include <asm/xen/interface.h>
ad9a8612
JF
55
56#include <asm/pgtable.h>
57#include <asm/sync_bitops.h>
58
ad9a8612
JF
59/* External tools reserve first few grant table entries. */
60#define NR_RESERVED_ENTRIES 8
61#define GNTTAB_LIST_END 0xffffffff
ad9a8612
JF
62
63static grant_ref_t **gnttab_list;
64static unsigned int nr_grant_frames;
ad9a8612
JF
65static int gnttab_free_count;
66static grant_ref_t gnttab_free_head;
67static DEFINE_SPINLOCK(gnttab_list_lock);
efaf30a3 68struct grant_frames xen_auto_xlat_grant_frames;
ad9a8612 69
0f9f5a95
AL
70static union {
71 struct grant_entry_v1 *v1;
85ff6acb 72 union grant_entry_v2 *v2;
0f9f5a95
AL
73 void *addr;
74} gnttab_shared;
75
76/*This is a structure of function pointers for grant table*/
77struct gnttab_ops {
78 /*
9dbc71d5
AL
79 * Mapping a list of frames for storing grant entries. Frames parameter
80 * is used to store grant table address when grant table being setup,
81 * nr_gframes is the number of frames to map grant table. Returning
82 * GNTST_okay means success and negative value means failure.
0f9f5a95 83 */
ef32f892 84 int (*map_frames)(xen_pfn_t *frames, unsigned int nr_gframes);
0f9f5a95
AL
85 /*
86 * Release a list of frames which are mapped in map_frames for grant
87 * entry status.
88 */
89 void (*unmap_frames)(void);
90 /*
9dbc71d5
AL
91 * Introducing a valid entry into the grant table, granting the frame of
92 * this grant entry to domain for accessing or transfering. Ref
93 * parameter is reference of this introduced grant entry, domid is id of
94 * granted domain, frame is the page frame to be granted, and flags is
95 * status of the grant entry to be updated.
0f9f5a95 96 */
9dbc71d5
AL
97 void (*update_entry)(grant_ref_t ref, domid_t domid,
98 unsigned long frame, unsigned flags);
0f9f5a95 99 /*
9dbc71d5
AL
100 * Stop granting a grant entry to domain for accessing. Ref parameter is
101 * reference of a grant entry whose grant access will be stopped,
102 * readonly is not in use in this function. If the grant entry is
0f9f5a95
AL
103 * currently mapped for reading or writing, just return failure(==0)
104 * directly and don't tear down the grant access. Otherwise, stop grant
105 * access for this entry and return success(==1).
106 */
9dbc71d5 107 int (*end_foreign_access_ref)(grant_ref_t ref, int readonly);
0f9f5a95 108 /*
9dbc71d5
AL
109 * Stop granting a grant entry to domain for transfer. Ref parameter is
110 * reference of a grant entry whose grant transfer will be stopped. If
111 * tranfer has not started, just reclaim the grant entry and return
112 * failure(==0). Otherwise, wait for the transfer to complete and then
113 * return the frame.
0f9f5a95 114 */
9dbc71d5 115 unsigned long (*end_foreign_transfer_ref)(grant_ref_t ref);
0f9f5a95 116 /*
9dbc71d5 117 * Query the status of a grant entry. Ref parameter is reference of
0f9f5a95
AL
118 * queried grant entry, return value is the status of queried entry.
119 * Detailed status(writing/reading) can be gotten from the return value
120 * by bit operations.
121 */
9dbc71d5 122 int (*query_foreign_access)(grant_ref_t ref);
6666754b
AL
123 /*
124 * Grant a domain to access a range of bytes within the page referred by
125 * an available grant entry. Ref parameter is reference of a grant entry
126 * which will be sub-page accessed, domid is id of grantee domain, frame
127 * is frame address of subpage grant, flags is grant type and flag
128 * information, page_off is offset of the range of bytes, and length is
129 * length of bytes to be accessed.
130 */
131 void (*update_subpage_entry)(grant_ref_t ref, domid_t domid,
132 unsigned long frame, int flags,
133 unsigned page_off, unsigned length);
9438ce9d
AL
134 /*
135 * Redirect an available grant entry on domain A to another grant
136 * reference of domain B, then allow domain C to use grant reference
137 * of domain B transitively. Ref parameter is an available grant entry
138 * reference on domain A, domid is id of domain C which accesses grant
139 * entry transitively, flags is grant type and flag information,
140 * trans_domid is id of domain B whose grant entry is finally accessed
141 * transitively, trans_gref is grant entry transitive reference of
142 * domain B.
143 */
144 void (*update_trans_entry)(grant_ref_t ref, domid_t domid, int flags,
145 domid_t trans_domid, grant_ref_t trans_gref);
0f9f5a95
AL
146};
147
148static struct gnttab_ops *gnttab_interface;
149
85ff6acb
AL
150/*This reflects status of grant entries, so act as a global value*/
151static grant_status_t *grstatus;
152
0f9f5a95 153static int grant_table_version;
d0b4d64a 154static int grefs_per_grant_frame;
ad9a8612
JF
155
156static struct gnttab_free_callback *gnttab_free_callback_list;
157
158static int gnttab_expand(unsigned int req_entries);
159
160#define RPP (PAGE_SIZE / sizeof(grant_ref_t))
85ff6acb 161#define SPP (PAGE_SIZE / sizeof(grant_status_t))
ad9a8612
JF
162
163static inline grant_ref_t *__gnttab_entry(grant_ref_t entry)
164{
165 return &gnttab_list[(entry) / RPP][(entry) % RPP];
166}
167/* This can be used as an l-value */
168#define gnttab_entry(entry) (*__gnttab_entry(entry))
169
170static int get_free_entries(unsigned count)
171{
172 unsigned long flags;
272800dc 173 int ref, rc = 0;
ad9a8612
JF
174 grant_ref_t head;
175
176 spin_lock_irqsave(&gnttab_list_lock, flags);
177
178 if ((gnttab_free_count < count) &&
179 ((rc = gnttab_expand(count - gnttab_free_count)) < 0)) {
180 spin_unlock_irqrestore(&gnttab_list_lock, flags);
181 return rc;
182 }
183
184 ref = head = gnttab_free_head;
185 gnttab_free_count -= count;
186 while (count-- > 1)
187 head = gnttab_entry(head);
188 gnttab_free_head = gnttab_entry(head);
189 gnttab_entry(head) = GNTTAB_LIST_END;
190
191 spin_unlock_irqrestore(&gnttab_list_lock, flags);
192
193 return ref;
194}
195
196static void do_free_callbacks(void)
197{
198 struct gnttab_free_callback *callback, *next;
199
200 callback = gnttab_free_callback_list;
201 gnttab_free_callback_list = NULL;
202
203 while (callback != NULL) {
204 next = callback->next;
205 if (gnttab_free_count >= callback->count) {
206 callback->next = NULL;
207 callback->fn(callback->arg);
208 } else {
209 callback->next = gnttab_free_callback_list;
210 gnttab_free_callback_list = callback;
211 }
212 callback = next;
213 }
214}
215
216static inline void check_free_callbacks(void)
217{
218 if (unlikely(gnttab_free_callback_list))
219 do_free_callbacks();
220}
221
222static void put_free_entry(grant_ref_t ref)
223{
224 unsigned long flags;
225 spin_lock_irqsave(&gnttab_list_lock, flags);
226 gnttab_entry(ref) = gnttab_free_head;
227 gnttab_free_head = ref;
228 gnttab_free_count++;
229 check_free_callbacks();
230 spin_unlock_irqrestore(&gnttab_list_lock, flags);
231}
232
0f9f5a95 233/*
85ff6acb 234 * Following applies to gnttab_update_entry_v1 and gnttab_update_entry_v2.
0f9f5a95
AL
235 * Introducing a valid entry into the grant table:
236 * 1. Write ent->domid.
237 * 2. Write ent->frame:
238 * GTF_permit_access: Frame to which access is permitted.
239 * GTF_accept_transfer: Pseudo-phys frame slot being filled by new
240 * frame, or zero if none.
241 * 3. Write memory barrier (WMB).
242 * 4. Write ent->flags, inc. valid type.
243 */
244static void gnttab_update_entry_v1(grant_ref_t ref, domid_t domid,
245 unsigned long frame, unsigned flags)
ad9a8612 246{
0f9f5a95
AL
247 gnttab_shared.v1[ref].domid = domid;
248 gnttab_shared.v1[ref].frame = frame;
ad9a8612 249 wmb();
0f9f5a95 250 gnttab_shared.v1[ref].flags = flags;
ad9a8612
JF
251}
252
85ff6acb
AL
253static void gnttab_update_entry_v2(grant_ref_t ref, domid_t domid,
254 unsigned long frame, unsigned flags)
255{
256 gnttab_shared.v2[ref].hdr.domid = domid;
257 gnttab_shared.v2[ref].full_page.frame = frame;
258 wmb();
259 gnttab_shared.v2[ref].hdr.flags = GTF_permit_access | flags;
260}
261
ad9a8612
JF
262/*
263 * Public grant-issuing interface functions
264 */
265void gnttab_grant_foreign_access_ref(grant_ref_t ref, domid_t domid,
266 unsigned long frame, int readonly)
267{
0f9f5a95 268 gnttab_interface->update_entry(ref, domid, frame,
ad9a8612
JF
269 GTF_permit_access | (readonly ? GTF_readonly : 0));
270}
271EXPORT_SYMBOL_GPL(gnttab_grant_foreign_access_ref);
272
273int gnttab_grant_foreign_access(domid_t domid, unsigned long frame,
274 int readonly)
275{
276 int ref;
277
278 ref = get_free_entries(1);
279 if (unlikely(ref < 0))
280 return -ENOSPC;
281
282 gnttab_grant_foreign_access_ref(ref, domid, frame, readonly);
283
284 return ref;
285}
286EXPORT_SYMBOL_GPL(gnttab_grant_foreign_access);
287
b8b0f559
KRW
288static void gnttab_update_subpage_entry_v2(grant_ref_t ref, domid_t domid,
289 unsigned long frame, int flags,
290 unsigned page_off, unsigned length)
6666754b
AL
291{
292 gnttab_shared.v2[ref].sub_page.frame = frame;
293 gnttab_shared.v2[ref].sub_page.page_off = page_off;
294 gnttab_shared.v2[ref].sub_page.length = length;
295 gnttab_shared.v2[ref].hdr.domid = domid;
296 wmb();
297 gnttab_shared.v2[ref].hdr.flags =
298 GTF_permit_access | GTF_sub_page | flags;
299}
300
301int gnttab_grant_foreign_access_subpage_ref(grant_ref_t ref, domid_t domid,
302 unsigned long frame, int flags,
303 unsigned page_off,
304 unsigned length)
305{
306 if (flags & (GTF_accept_transfer | GTF_reading |
307 GTF_writing | GTF_transitive))
308 return -EPERM;
309
310 if (gnttab_interface->update_subpage_entry == NULL)
311 return -ENOSYS;
312
313 gnttab_interface->update_subpage_entry(ref, domid, frame, flags,
314 page_off, length);
315
316 return 0;
317}
318EXPORT_SYMBOL_GPL(gnttab_grant_foreign_access_subpage_ref);
319
320int gnttab_grant_foreign_access_subpage(domid_t domid, unsigned long frame,
321 int flags, unsigned page_off,
322 unsigned length)
323{
324 int ref, rc;
325
326 ref = get_free_entries(1);
327 if (unlikely(ref < 0))
328 return -ENOSPC;
329
330 rc = gnttab_grant_foreign_access_subpage_ref(ref, domid, frame, flags,
331 page_off, length);
332 if (rc < 0) {
333 put_free_entry(ref);
334 return rc;
335 }
336
337 return ref;
338}
339EXPORT_SYMBOL_GPL(gnttab_grant_foreign_access_subpage);
340
341bool gnttab_subpage_grants_available(void)
342{
343 return gnttab_interface->update_subpage_entry != NULL;
344}
345EXPORT_SYMBOL_GPL(gnttab_subpage_grants_available);
346
b8b0f559
KRW
347static void gnttab_update_trans_entry_v2(grant_ref_t ref, domid_t domid,
348 int flags, domid_t trans_domid,
349 grant_ref_t trans_gref)
9438ce9d
AL
350{
351 gnttab_shared.v2[ref].transitive.trans_domid = trans_domid;
352 gnttab_shared.v2[ref].transitive.gref = trans_gref;
353 gnttab_shared.v2[ref].hdr.domid = domid;
354 wmb();
355 gnttab_shared.v2[ref].hdr.flags =
356 GTF_permit_access | GTF_transitive | flags;
357}
358
359int gnttab_grant_foreign_access_trans_ref(grant_ref_t ref, domid_t domid,
360 int flags, domid_t trans_domid,
361 grant_ref_t trans_gref)
362{
363 if (flags & (GTF_accept_transfer | GTF_reading |
364 GTF_writing | GTF_sub_page))
365 return -EPERM;
366
367 if (gnttab_interface->update_trans_entry == NULL)
368 return -ENOSYS;
369
370 gnttab_interface->update_trans_entry(ref, domid, flags, trans_domid,
371 trans_gref);
372
373 return 0;
374}
375EXPORT_SYMBOL_GPL(gnttab_grant_foreign_access_trans_ref);
376
377int gnttab_grant_foreign_access_trans(domid_t domid, int flags,
378 domid_t trans_domid,
379 grant_ref_t trans_gref)
380{
381 int ref, rc;
382
383 ref = get_free_entries(1);
384 if (unlikely(ref < 0))
385 return -ENOSPC;
386
387 rc = gnttab_grant_foreign_access_trans_ref(ref, domid, flags,
388 trans_domid, trans_gref);
389 if (rc < 0) {
390 put_free_entry(ref);
391 return rc;
392 }
393
394 return ref;
395}
396EXPORT_SYMBOL_GPL(gnttab_grant_foreign_access_trans);
397
398bool gnttab_trans_grants_available(void)
399{
400 return gnttab_interface->update_trans_entry != NULL;
401}
402EXPORT_SYMBOL_GPL(gnttab_trans_grants_available);
403
0f9f5a95 404static int gnttab_query_foreign_access_v1(grant_ref_t ref)
ad9a8612 405{
0f9f5a95
AL
406 return gnttab_shared.v1[ref].flags & (GTF_reading|GTF_writing);
407}
ad9a8612 408
85ff6acb
AL
409static int gnttab_query_foreign_access_v2(grant_ref_t ref)
410{
411 return grstatus[ref] & (GTF_reading|GTF_writing);
412}
413
0f9f5a95
AL
414int gnttab_query_foreign_access(grant_ref_t ref)
415{
416 return gnttab_interface->query_foreign_access(ref);
ad9a8612
JF
417}
418EXPORT_SYMBOL_GPL(gnttab_query_foreign_access);
419
0f9f5a95 420static int gnttab_end_foreign_access_ref_v1(grant_ref_t ref, int readonly)
ad9a8612
JF
421{
422 u16 flags, nflags;
b1e495b2 423 u16 *pflags;
ad9a8612 424
b1e495b2
AL
425 pflags = &gnttab_shared.v1[ref].flags;
426 nflags = *pflags;
ad9a8612
JF
427 do {
428 flags = nflags;
569ca5b3 429 if (flags & (GTF_reading|GTF_writing))
ad9a8612 430 return 0;
b1e495b2 431 } while ((nflags = sync_cmpxchg(pflags, flags, 0)) != flags);
ad9a8612
JF
432
433 return 1;
434}
0f9f5a95 435
85ff6acb
AL
436static int gnttab_end_foreign_access_ref_v2(grant_ref_t ref, int readonly)
437{
438 gnttab_shared.v2[ref].hdr.flags = 0;
439 mb();
440 if (grstatus[ref] & (GTF_reading|GTF_writing)) {
441 return 0;
442 } else {
443 /* The read of grstatus needs to have acquire
444 semantics. On x86, reads already have
445 that, and we just need to protect against
446 compiler reorderings. On other
447 architectures we may need a full
448 barrier. */
449#ifdef CONFIG_X86
450 barrier();
451#else
452 mb();
453#endif
454 }
455
456 return 1;
457}
458
569ca5b3 459static inline int _gnttab_end_foreign_access_ref(grant_ref_t ref, int readonly)
0f9f5a95
AL
460{
461 return gnttab_interface->end_foreign_access_ref(ref, readonly);
462}
569ca5b3
JB
463
464int gnttab_end_foreign_access_ref(grant_ref_t ref, int readonly)
465{
466 if (_gnttab_end_foreign_access_ref(ref, readonly))
467 return 1;
468 pr_warn("WARNING: g.e. %#x still in use!\n", ref);
469 return 0;
470}
ad9a8612
JF
471EXPORT_SYMBOL_GPL(gnttab_end_foreign_access_ref);
472
569ca5b3
JB
473struct deferred_entry {
474 struct list_head list;
475 grant_ref_t ref;
476 bool ro;
477 uint16_t warn_delay;
478 struct page *page;
479};
480static LIST_HEAD(deferred_list);
481static void gnttab_handle_deferred(unsigned long);
482static DEFINE_TIMER(deferred_timer, gnttab_handle_deferred, 0, 0);
483
484static void gnttab_handle_deferred(unsigned long unused)
485{
486 unsigned int nr = 10;
487 struct deferred_entry *first = NULL;
488 unsigned long flags;
489
490 spin_lock_irqsave(&gnttab_list_lock, flags);
491 while (nr--) {
492 struct deferred_entry *entry
493 = list_first_entry(&deferred_list,
494 struct deferred_entry, list);
495
496 if (entry == first)
497 break;
498 list_del(&entry->list);
499 spin_unlock_irqrestore(&gnttab_list_lock, flags);
500 if (_gnttab_end_foreign_access_ref(entry->ref, entry->ro)) {
501 put_free_entry(entry->ref);
502 if (entry->page) {
503 pr_debug("freeing g.e. %#x (pfn %#lx)\n",
504 entry->ref, page_to_pfn(entry->page));
505 __free_page(entry->page);
506 } else
507 pr_info("freeing g.e. %#x\n", entry->ref);
508 kfree(entry);
509 entry = NULL;
510 } else {
511 if (!--entry->warn_delay)
283c0972 512 pr_info("g.e. %#x still pending\n", entry->ref);
569ca5b3
JB
513 if (!first)
514 first = entry;
515 }
516 spin_lock_irqsave(&gnttab_list_lock, flags);
517 if (entry)
518 list_add_tail(&entry->list, &deferred_list);
519 else if (list_empty(&deferred_list))
520 break;
521 }
522 if (!list_empty(&deferred_list) && !timer_pending(&deferred_timer)) {
523 deferred_timer.expires = jiffies + HZ;
524 add_timer(&deferred_timer);
525 }
526 spin_unlock_irqrestore(&gnttab_list_lock, flags);
527}
528
529static void gnttab_add_deferred(grant_ref_t ref, bool readonly,
530 struct page *page)
531{
532 struct deferred_entry *entry = kmalloc(sizeof(*entry), GFP_ATOMIC);
533 const char *what = KERN_WARNING "leaking";
534
535 if (entry) {
536 unsigned long flags;
537
538 entry->ref = ref;
539 entry->ro = readonly;
540 entry->page = page;
541 entry->warn_delay = 60;
542 spin_lock_irqsave(&gnttab_list_lock, flags);
543 list_add_tail(&entry->list, &deferred_list);
544 if (!timer_pending(&deferred_timer)) {
545 deferred_timer.expires = jiffies + HZ;
546 add_timer(&deferred_timer);
547 }
548 spin_unlock_irqrestore(&gnttab_list_lock, flags);
549 what = KERN_DEBUG "deferring";
550 }
551 printk("%s g.e. %#x (pfn %#lx)\n",
552 what, ref, page ? page_to_pfn(page) : -1);
553}
554
ad9a8612
JF
555void gnttab_end_foreign_access(grant_ref_t ref, int readonly,
556 unsigned long page)
557{
558 if (gnttab_end_foreign_access_ref(ref, readonly)) {
559 put_free_entry(ref);
560 if (page != 0)
561 free_page(page);
569ca5b3
JB
562 } else
563 gnttab_add_deferred(ref, readonly,
564 page ? virt_to_page(page) : NULL);
ad9a8612
JF
565}
566EXPORT_SYMBOL_GPL(gnttab_end_foreign_access);
567
568int gnttab_grant_foreign_transfer(domid_t domid, unsigned long pfn)
569{
570 int ref;
571
572 ref = get_free_entries(1);
573 if (unlikely(ref < 0))
574 return -ENOSPC;
575 gnttab_grant_foreign_transfer_ref(ref, domid, pfn);
576
577 return ref;
578}
579EXPORT_SYMBOL_GPL(gnttab_grant_foreign_transfer);
580
581void gnttab_grant_foreign_transfer_ref(grant_ref_t ref, domid_t domid,
582 unsigned long pfn)
583{
0f9f5a95 584 gnttab_interface->update_entry(ref, domid, pfn, GTF_accept_transfer);
ad9a8612
JF
585}
586EXPORT_SYMBOL_GPL(gnttab_grant_foreign_transfer_ref);
587
0f9f5a95 588static unsigned long gnttab_end_foreign_transfer_ref_v1(grant_ref_t ref)
ad9a8612
JF
589{
590 unsigned long frame;
591 u16 flags;
b1e495b2
AL
592 u16 *pflags;
593
594 pflags = &gnttab_shared.v1[ref].flags;
ad9a8612
JF
595
596 /*
597 * If a transfer is not even yet started, try to reclaim the grant
598 * reference and return failure (== 0).
599 */
b1e495b2
AL
600 while (!((flags = *pflags) & GTF_transfer_committed)) {
601 if (sync_cmpxchg(pflags, flags, 0) == flags)
ad9a8612
JF
602 return 0;
603 cpu_relax();
604 }
605
606 /* If a transfer is in progress then wait until it is completed. */
607 while (!(flags & GTF_transfer_completed)) {
b1e495b2 608 flags = *pflags;
ad9a8612
JF
609 cpu_relax();
610 }
611
612 rmb(); /* Read the frame number /after/ reading completion status. */
0f9f5a95 613 frame = gnttab_shared.v1[ref].frame;
ad9a8612
JF
614 BUG_ON(frame == 0);
615
616 return frame;
617}
0f9f5a95 618
85ff6acb
AL
619static unsigned long gnttab_end_foreign_transfer_ref_v2(grant_ref_t ref)
620{
621 unsigned long frame;
622 u16 flags;
623 u16 *pflags;
624
625 pflags = &gnttab_shared.v2[ref].hdr.flags;
626
627 /*
628 * If a transfer is not even yet started, try to reclaim the grant
629 * reference and return failure (== 0).
630 */
631 while (!((flags = *pflags) & GTF_transfer_committed)) {
632 if (sync_cmpxchg(pflags, flags, 0) == flags)
633 return 0;
634 cpu_relax();
635 }
636
637 /* If a transfer is in progress then wait until it is completed. */
638 while (!(flags & GTF_transfer_completed)) {
639 flags = *pflags;
640 cpu_relax();
641 }
642
643 rmb(); /* Read the frame number /after/ reading completion status. */
644 frame = gnttab_shared.v2[ref].full_page.frame;
645 BUG_ON(frame == 0);
646
647 return frame;
648}
649
0f9f5a95
AL
650unsigned long gnttab_end_foreign_transfer_ref(grant_ref_t ref)
651{
652 return gnttab_interface->end_foreign_transfer_ref(ref);
653}
ad9a8612
JF
654EXPORT_SYMBOL_GPL(gnttab_end_foreign_transfer_ref);
655
656unsigned long gnttab_end_foreign_transfer(grant_ref_t ref)
657{
658 unsigned long frame = gnttab_end_foreign_transfer_ref(ref);
659 put_free_entry(ref);
660 return frame;
661}
662EXPORT_SYMBOL_GPL(gnttab_end_foreign_transfer);
663
664void gnttab_free_grant_reference(grant_ref_t ref)
665{
666 put_free_entry(ref);
667}
668EXPORT_SYMBOL_GPL(gnttab_free_grant_reference);
669
670void gnttab_free_grant_references(grant_ref_t head)
671{
672 grant_ref_t ref;
673 unsigned long flags;
674 int count = 1;
675 if (head == GNTTAB_LIST_END)
676 return;
677 spin_lock_irqsave(&gnttab_list_lock, flags);
678 ref = head;
679 while (gnttab_entry(ref) != GNTTAB_LIST_END) {
680 ref = gnttab_entry(ref);
681 count++;
682 }
683 gnttab_entry(ref) = gnttab_free_head;
684 gnttab_free_head = head;
685 gnttab_free_count += count;
686 check_free_callbacks();
687 spin_unlock_irqrestore(&gnttab_list_lock, flags);
688}
689EXPORT_SYMBOL_GPL(gnttab_free_grant_references);
690
691int gnttab_alloc_grant_references(u16 count, grant_ref_t *head)
692{
693 int h = get_free_entries(count);
694
695 if (h < 0)
696 return -ENOSPC;
697
698 *head = h;
699
700 return 0;
701}
702EXPORT_SYMBOL_GPL(gnttab_alloc_grant_references);
703
704int gnttab_empty_grant_references(const grant_ref_t *private_head)
705{
706 return (*private_head == GNTTAB_LIST_END);
707}
708EXPORT_SYMBOL_GPL(gnttab_empty_grant_references);
709
710int gnttab_claim_grant_reference(grant_ref_t *private_head)
711{
712 grant_ref_t g = *private_head;
713 if (unlikely(g == GNTTAB_LIST_END))
714 return -ENOSPC;
715 *private_head = gnttab_entry(g);
716 return g;
717}
718EXPORT_SYMBOL_GPL(gnttab_claim_grant_reference);
719
720void gnttab_release_grant_reference(grant_ref_t *private_head,
721 grant_ref_t release)
722{
723 gnttab_entry(release) = *private_head;
724 *private_head = release;
725}
726EXPORT_SYMBOL_GPL(gnttab_release_grant_reference);
727
728void gnttab_request_free_callback(struct gnttab_free_callback *callback,
729 void (*fn)(void *), void *arg, u16 count)
730{
731 unsigned long flags;
5f338d90
RPM
732 struct gnttab_free_callback *cb;
733
ad9a8612 734 spin_lock_irqsave(&gnttab_list_lock, flags);
5f338d90
RPM
735
736 /* Check if the callback is already on the list */
737 cb = gnttab_free_callback_list;
738 while (cb) {
739 if (cb == callback)
740 goto out;
741 cb = cb->next;
742 }
743
ad9a8612
JF
744 callback->fn = fn;
745 callback->arg = arg;
746 callback->count = count;
747 callback->next = gnttab_free_callback_list;
748 gnttab_free_callback_list = callback;
749 check_free_callbacks();
750out:
751 spin_unlock_irqrestore(&gnttab_list_lock, flags);
752}
753EXPORT_SYMBOL_GPL(gnttab_request_free_callback);
754
755void gnttab_cancel_free_callback(struct gnttab_free_callback *callback)
756{
757 struct gnttab_free_callback **pcb;
758 unsigned long flags;
759
760 spin_lock_irqsave(&gnttab_list_lock, flags);
761 for (pcb = &gnttab_free_callback_list; *pcb; pcb = &(*pcb)->next) {
762 if (*pcb == callback) {
763 *pcb = callback->next;
764 break;
765 }
766 }
767 spin_unlock_irqrestore(&gnttab_list_lock, flags);
768}
769EXPORT_SYMBOL_GPL(gnttab_cancel_free_callback);
770
771static int grow_gnttab_list(unsigned int more_frames)
772{
773 unsigned int new_nr_grant_frames, extra_entries, i;
bbc60c18 774 unsigned int nr_glist_frames, new_nr_glist_frames;
ad9a8612 775
d0b4d64a
MW
776 BUG_ON(grefs_per_grant_frame == 0);
777
ad9a8612 778 new_nr_grant_frames = nr_grant_frames + more_frames;
d0b4d64a 779 extra_entries = more_frames * grefs_per_grant_frame;
ad9a8612 780
d0b4d64a 781 nr_glist_frames = (nr_grant_frames * grefs_per_grant_frame + RPP - 1) / RPP;
bbc60c18 782 new_nr_glist_frames =
d0b4d64a 783 (new_nr_grant_frames * grefs_per_grant_frame + RPP - 1) / RPP;
bbc60c18 784 for (i = nr_glist_frames; i < new_nr_glist_frames; i++) {
ad9a8612
JF
785 gnttab_list[i] = (grant_ref_t *)__get_free_page(GFP_ATOMIC);
786 if (!gnttab_list[i])
787 goto grow_nomem;
788 }
789
790
d0b4d64a
MW
791 for (i = grefs_per_grant_frame * nr_grant_frames;
792 i < grefs_per_grant_frame * new_nr_grant_frames - 1; i++)
ad9a8612
JF
793 gnttab_entry(i) = i + 1;
794
795 gnttab_entry(i) = gnttab_free_head;
d0b4d64a 796 gnttab_free_head = grefs_per_grant_frame * nr_grant_frames;
ad9a8612
JF
797 gnttab_free_count += extra_entries;
798
799 nr_grant_frames = new_nr_grant_frames;
800
801 check_free_callbacks();
802
803 return 0;
804
805grow_nomem:
bbc60c18 806 for ( ; i >= nr_glist_frames; i--)
ad9a8612
JF
807 free_page((unsigned long) gnttab_list[i]);
808 return -ENOMEM;
809}
810
811static unsigned int __max_nr_grant_frames(void)
812{
813 struct gnttab_query_size query;
814 int rc;
815
816 query.dom = DOMID_SELF;
817
818 rc = HYPERVISOR_grant_table_op(GNTTABOP_query_size, &query, 1);
819 if ((rc < 0) || (query.status != GNTST_okay))
820 return 4; /* Legacy max supported number of frames */
821
822 return query.max_nr_frames;
823}
824
183d03cc 825unsigned int gnttab_max_grant_frames(void)
ad9a8612
JF
826{
827 unsigned int xen_max = __max_nr_grant_frames();
7f256020
KRW
828 static unsigned int boot_max_nr_grant_frames;
829
830 /* First time, initialize it properly. */
831 if (!boot_max_nr_grant_frames)
832 boot_max_nr_grant_frames = __max_nr_grant_frames();
ad9a8612
JF
833
834 if (xen_max > boot_max_nr_grant_frames)
835 return boot_max_nr_grant_frames;
836 return xen_max;
837}
183d03cc 838EXPORT_SYMBOL_GPL(gnttab_max_grant_frames);
ad9a8612 839
47c54205 840int gnttab_setup_auto_xlat_frames(phys_addr_t addr)
efaf30a3
KRW
841{
842 xen_pfn_t *pfn;
843 unsigned int max_nr_gframes = __max_nr_grant_frames();
844 unsigned int i;
845 void *vaddr;
846
847 if (xen_auto_xlat_grant_frames.count)
848 return -EINVAL;
849
850 vaddr = xen_remap(addr, PAGE_SIZE * max_nr_gframes);
851 if (vaddr == NULL) {
47c54205
JG
852 pr_warn("Failed to ioremap gnttab share frames (addr=%pa)!\n",
853 &addr);
efaf30a3
KRW
854 return -ENOMEM;
855 }
856 pfn = kcalloc(max_nr_gframes, sizeof(pfn[0]), GFP_KERNEL);
857 if (!pfn) {
858 xen_unmap(vaddr);
859 return -ENOMEM;
860 }
861 for (i = 0; i < max_nr_gframes; i++)
862 pfn[i] = PFN_DOWN(addr) + i;
863
864 xen_auto_xlat_grant_frames.vaddr = vaddr;
865 xen_auto_xlat_grant_frames.pfn = pfn;
866 xen_auto_xlat_grant_frames.count = max_nr_gframes;
867
868 return 0;
869}
870EXPORT_SYMBOL_GPL(gnttab_setup_auto_xlat_frames);
871
872void gnttab_free_auto_xlat_frames(void)
873{
874 if (!xen_auto_xlat_grant_frames.count)
875 return;
876 kfree(xen_auto_xlat_grant_frames.pfn);
877 xen_unmap(xen_auto_xlat_grant_frames.vaddr);
878
879 xen_auto_xlat_grant_frames.pfn = NULL;
880 xen_auto_xlat_grant_frames.count = 0;
881 xen_auto_xlat_grant_frames.vaddr = NULL;
882}
883EXPORT_SYMBOL_GPL(gnttab_free_auto_xlat_frames);
884
c571898f
ALC
885/* Handling of paged out grant targets (GNTST_eagain) */
886#define MAX_DELAY 256
887static inline void
888gnttab_retry_eagain_gop(unsigned int cmd, void *gop, int16_t *status,
889 const char *func)
890{
891 unsigned delay = 1;
892
893 do {
894 BUG_ON(HYPERVISOR_grant_table_op(cmd, gop, 1));
895 if (*status == GNTST_eagain)
896 msleep(delay++);
897 } while ((*status == GNTST_eagain) && (delay < MAX_DELAY));
898
899 if (delay >= MAX_DELAY) {
283c0972 900 pr_err("%s: %s eagain grant\n", func, current->comm);
c571898f
ALC
901 *status = GNTST_bad_page;
902 }
903}
904
905void gnttab_batch_map(struct gnttab_map_grant_ref *batch, unsigned count)
906{
907 struct gnttab_map_grant_ref *op;
908
909 if (HYPERVISOR_grant_table_op(GNTTABOP_map_grant_ref, batch, count))
910 BUG();
911 for (op = batch; op < batch + count; op++)
912 if (op->status == GNTST_eagain)
913 gnttab_retry_eagain_gop(GNTTABOP_map_grant_ref, op,
914 &op->status, __func__);
915}
916EXPORT_SYMBOL_GPL(gnttab_batch_map);
917
918void gnttab_batch_copy(struct gnttab_copy *batch, unsigned count)
919{
920 struct gnttab_copy *op;
921
922 if (HYPERVISOR_grant_table_op(GNTTABOP_copy, batch, count))
923 BUG();
924 for (op = batch; op < batch + count; op++)
925 if (op->status == GNTST_eagain)
926 gnttab_retry_eagain_gop(GNTTABOP_copy, op,
927 &op->status, __func__);
928}
929EXPORT_SYMBOL_GPL(gnttab_batch_copy);
930
08ece5bb 931int __gnttab_map_refs(struct gnttab_map_grant_ref *map_ops,
c123799a 932 struct gnttab_map_grant_ref *kmap_ops,
08ece5bb
ZK
933 struct page **pages, unsigned int count,
934 bool m2p_override)
289b777e
SS
935{
936 int i, ret;
f62805f1 937 bool lazy = false;
289b777e 938 pte_t *pte;
08ece5bb 939 unsigned long mfn, pfn;
289b777e 940
08ece5bb 941 BUG_ON(kmap_ops && !m2p_override);
289b777e 942 ret = HYPERVISOR_grant_table_op(GNTTABOP_map_grant_ref, map_ops, count);
87f1d40a
JF
943 if (ret)
944 return ret;
289b777e 945
c571898f
ALC
946 /* Retry eagain maps */
947 for (i = 0; i < count; i++)
948 if (map_ops[i].status == GNTST_eagain)
949 gnttab_retry_eagain_gop(GNTTABOP_map_grant_ref, map_ops + i,
950 &map_ops[i].status, __func__);
951
3d24bbd7
SS
952 /* this is basically a nop on x86 */
953 if (xen_feature(XENFEAT_auto_translated_physmap)) {
954 for (i = 0; i < count; i++) {
955 if (map_ops[i].status)
956 continue;
957 set_phys_to_machine(map_ops[i].host_addr >> PAGE_SHIFT,
958 map_ops[i].dev_bus_addr >> PAGE_SHIFT);
959 }
08ece5bb 960 return 0;
3d24bbd7 961 }
aab8f11a 962
08ece5bb
ZK
963 if (m2p_override &&
964 !in_interrupt() &&
965 paravirt_get_lazy_mode() == PARAVIRT_LAZY_NONE) {
f62805f1
SS
966 arch_enter_lazy_mmu_mode();
967 lazy = true;
968 }
969
289b777e 970 for (i = 0; i < count; i++) {
dc4972a4
IC
971 /* Do not add to override if the map failed. */
972 if (map_ops[i].status)
973 continue;
974
cf8d9163
KRW
975 if (map_ops[i].flags & GNTMAP_contains_pte) {
976 pte = (pte_t *) (mfn_to_virt(PFN_DOWN(map_ops[i].host_addr)) +
289b777e 977 (map_ops[i].host_addr & ~PAGE_MASK));
cf8d9163
KRW
978 mfn = pte_mfn(*pte);
979 } else {
7d17e84b 980 mfn = PFN_DOWN(map_ops[i].dev_bus_addr);
cf8d9163 981 }
08ece5bb
ZK
982 pfn = page_to_pfn(pages[i]);
983
984 WARN_ON(PagePrivate(pages[i]));
985 SetPagePrivate(pages[i]);
986 set_page_private(pages[i], mfn);
987
988 pages[i]->index = pfn_to_mfn(pfn);
989 if (unlikely(!set_phys_to_machine(pfn, FOREIGN_FRAME(mfn)))) {
990 ret = -ENOMEM;
991 goto out;
992 }
993 if (m2p_override)
994 ret = m2p_add_override(mfn, pages[i], kmap_ops ?
995 &kmap_ops[i] : NULL);
87f1d40a 996 if (ret)
14883a75 997 goto out;
289b777e
SS
998 }
999
14883a75 1000 out:
f62805f1
SS
1001 if (lazy)
1002 arch_leave_lazy_mmu_mode();
1003
289b777e
SS
1004 return ret;
1005}
08ece5bb
ZK
1006
1007int gnttab_map_refs(struct gnttab_map_grant_ref *map_ops,
1008 struct page **pages, unsigned int count)
1009{
1010 return __gnttab_map_refs(map_ops, NULL, pages, count, false);
1011}
289b777e
SS
1012EXPORT_SYMBOL_GPL(gnttab_map_refs);
1013
08ece5bb
ZK
1014int gnttab_map_refs_userspace(struct gnttab_map_grant_ref *map_ops,
1015 struct gnttab_map_grant_ref *kmap_ops,
1016 struct page **pages, unsigned int count)
1017{
1018 return __gnttab_map_refs(map_ops, kmap_ops, pages, count, true);
1019}
1020EXPORT_SYMBOL_GPL(gnttab_map_refs_userspace);
1021
1022int __gnttab_unmap_refs(struct gnttab_unmap_grant_ref *unmap_ops,
2fc136ee 1023 struct gnttab_map_grant_ref *kmap_ops,
08ece5bb
ZK
1024 struct page **pages, unsigned int count,
1025 bool m2p_override)
289b777e
SS
1026{
1027 int i, ret;
f62805f1 1028 bool lazy = false;
08ece5bb 1029 unsigned long pfn, mfn;
289b777e 1030
08ece5bb 1031 BUG_ON(kmap_ops && !m2p_override);
289b777e 1032 ret = HYPERVISOR_grant_table_op(GNTTABOP_unmap_grant_ref, unmap_ops, count);
87f1d40a
JF
1033 if (ret)
1034 return ret;
1035
3d24bbd7
SS
1036 /* this is basically a nop on x86 */
1037 if (xen_feature(XENFEAT_auto_translated_physmap)) {
1038 for (i = 0; i < count; i++) {
1039 set_phys_to_machine(unmap_ops[i].host_addr >> PAGE_SHIFT,
1040 INVALID_P2M_ENTRY);
1041 }
08ece5bb 1042 return 0;
3d24bbd7 1043 }
aab8f11a 1044
08ece5bb
ZK
1045 if (m2p_override &&
1046 !in_interrupt() &&
1047 paravirt_get_lazy_mode() == PARAVIRT_LAZY_NONE) {
f62805f1
SS
1048 arch_enter_lazy_mmu_mode();
1049 lazy = true;
1050 }
1051
87f1d40a 1052 for (i = 0; i < count; i++) {
08ece5bb
ZK
1053 pfn = page_to_pfn(pages[i]);
1054 mfn = get_phys_to_machine(pfn);
1055 if (mfn == INVALID_P2M_ENTRY || !(mfn & FOREIGN_FRAME_BIT)) {
1056 ret = -EINVAL;
1057 goto out;
1058 }
1059
1060 set_page_private(pages[i], INVALID_P2M_ENTRY);
1061 WARN_ON(!PagePrivate(pages[i]));
1062 ClearPagePrivate(pages[i]);
1063 set_phys_to_machine(pfn, pages[i]->index);
1064 if (m2p_override)
1065 ret = m2p_remove_override(pages[i],
1066 kmap_ops ?
1067 &kmap_ops[i] : NULL,
1068 mfn);
87f1d40a 1069 if (ret)
14883a75 1070 goto out;
87f1d40a 1071 }
289b777e 1072
14883a75 1073 out:
f62805f1
SS
1074 if (lazy)
1075 arch_leave_lazy_mmu_mode();
1076
289b777e
SS
1077 return ret;
1078}
08ece5bb
ZK
1079
1080int gnttab_unmap_refs(struct gnttab_unmap_grant_ref *map_ops,
1081 struct page **pages, unsigned int count)
1082{
1083 return __gnttab_unmap_refs(map_ops, NULL, pages, count, false);
1084}
289b777e
SS
1085EXPORT_SYMBOL_GPL(gnttab_unmap_refs);
1086
08ece5bb
ZK
1087int gnttab_unmap_refs_userspace(struct gnttab_unmap_grant_ref *map_ops,
1088 struct gnttab_map_grant_ref *kmap_ops,
1089 struct page **pages, unsigned int count)
1090{
1091 return __gnttab_unmap_refs(map_ops, kmap_ops, pages, count, true);
1092}
1093EXPORT_SYMBOL_GPL(gnttab_unmap_refs_userspace);
1094
85ff6acb
AL
1095static unsigned nr_status_frames(unsigned nr_grant_frames)
1096{
d0b4d64a
MW
1097 BUG_ON(grefs_per_grant_frame == 0);
1098 return (nr_grant_frames * grefs_per_grant_frame + SPP - 1) / SPP;
85ff6acb
AL
1099}
1100
ef32f892 1101static int gnttab_map_frames_v1(xen_pfn_t *frames, unsigned int nr_gframes)
0f9f5a95
AL
1102{
1103 int rc;
1104
1105 rc = arch_gnttab_map_shared(frames, nr_gframes,
1106 gnttab_max_grant_frames(),
1107 &gnttab_shared.addr);
1108 BUG_ON(rc);
1109
1110 return 0;
1111}
1112
1113static void gnttab_unmap_frames_v1(void)
1114{
85ff6acb
AL
1115 arch_gnttab_unmap(gnttab_shared.addr, nr_grant_frames);
1116}
1117
ef32f892 1118static int gnttab_map_frames_v2(xen_pfn_t *frames, unsigned int nr_gframes)
85ff6acb
AL
1119{
1120 uint64_t *sframes;
1121 unsigned int nr_sframes;
1122 struct gnttab_get_status_frames getframes;
1123 int rc;
1124
1125 nr_sframes = nr_status_frames(nr_gframes);
1126
1127 /* No need for kzalloc as it is initialized in following hypercall
1128 * GNTTABOP_get_status_frames.
1129 */
1130 sframes = kmalloc(nr_sframes * sizeof(uint64_t), GFP_ATOMIC);
1131 if (!sframes)
1132 return -ENOMEM;
1133
1134 getframes.dom = DOMID_SELF;
1135 getframes.nr_frames = nr_sframes;
1136 set_xen_guest_handle(getframes.frame_list, sframes);
1137
1138 rc = HYPERVISOR_grant_table_op(GNTTABOP_get_status_frames,
1139 &getframes, 1);
1140 if (rc == -ENOSYS) {
1141 kfree(sframes);
1142 return -ENOSYS;
1143 }
1144
1145 BUG_ON(rc || getframes.status);
1146
1147 rc = arch_gnttab_map_status(sframes, nr_sframes,
1148 nr_status_frames(gnttab_max_grant_frames()),
1149 &grstatus);
1150 BUG_ON(rc);
1151 kfree(sframes);
1152
1153 rc = arch_gnttab_map_shared(frames, nr_gframes,
1154 gnttab_max_grant_frames(),
1155 &gnttab_shared.addr);
1156 BUG_ON(rc);
1157
1158 return 0;
1159}
1160
1161static void gnttab_unmap_frames_v2(void)
1162{
1163 arch_gnttab_unmap(gnttab_shared.addr, nr_grant_frames);
1164 arch_gnttab_unmap(grstatus, nr_status_frames(nr_grant_frames));
0f9f5a95
AL
1165}
1166
ad9a8612
JF
1167static int gnttab_map(unsigned int start_idx, unsigned int end_idx)
1168{
1169 struct gnttab_setup_table setup;
ef32f892 1170 xen_pfn_t *frames;
ad9a8612
JF
1171 unsigned int nr_gframes = end_idx + 1;
1172 int rc;
1173
6926f6d6 1174 if (xen_feature(XENFEAT_auto_translated_physmap)) {
183d03cc
SS
1175 struct xen_add_to_physmap xatp;
1176 unsigned int i = end_idx;
1177 rc = 0;
efaf30a3 1178 BUG_ON(xen_auto_xlat_grant_frames.count < nr_gframes);
183d03cc
SS
1179 /*
1180 * Loop backwards, so that the first hypercall has the largest
1181 * index, ensuring that the table will grow only once.
1182 */
1183 do {
1184 xatp.domid = DOMID_SELF;
1185 xatp.idx = i;
1186 xatp.space = XENMAPSPACE_grant_table;
efaf30a3 1187 xatp.gpfn = xen_auto_xlat_grant_frames.pfn[i];
183d03cc
SS
1188 rc = HYPERVISOR_memory_op(XENMEM_add_to_physmap, &xatp);
1189 if (rc != 0) {
283c0972
JP
1190 pr_warn("grant table add_to_physmap failed, err=%d\n",
1191 rc);
183d03cc
SS
1192 break;
1193 }
1194 } while (i-- > start_idx);
1195
1196 return rc;
1197 }
1198
85ff6acb
AL
1199 /* No need for kzalloc as it is initialized in following hypercall
1200 * GNTTABOP_setup_table.
1201 */
ad9a8612
JF
1202 frames = kmalloc(nr_gframes * sizeof(unsigned long), GFP_ATOMIC);
1203 if (!frames)
1204 return -ENOMEM;
1205
1206 setup.dom = DOMID_SELF;
1207 setup.nr_frames = nr_gframes;
87e27cf6 1208 set_xen_guest_handle(setup.frame_list, frames);
ad9a8612
JF
1209
1210 rc = HYPERVISOR_grant_table_op(GNTTABOP_setup_table, &setup, 1);
1211 if (rc == -ENOSYS) {
1212 kfree(frames);
1213 return -ENOSYS;
1214 }
1215
1216 BUG_ON(rc || setup.status);
1217
0f9f5a95 1218 rc = gnttab_interface->map_frames(frames, nr_gframes);
ad9a8612
JF
1219
1220 kfree(frames);
1221
0f9f5a95
AL
1222 return rc;
1223}
1224
1225static struct gnttab_ops gnttab_v1_ops = {
1226 .map_frames = gnttab_map_frames_v1,
1227 .unmap_frames = gnttab_unmap_frames_v1,
1228 .update_entry = gnttab_update_entry_v1,
1229 .end_foreign_access_ref = gnttab_end_foreign_access_ref_v1,
1230 .end_foreign_transfer_ref = gnttab_end_foreign_transfer_ref_v1,
1231 .query_foreign_access = gnttab_query_foreign_access_v1,
1232};
1233
85ff6acb
AL
1234static struct gnttab_ops gnttab_v2_ops = {
1235 .map_frames = gnttab_map_frames_v2,
1236 .unmap_frames = gnttab_unmap_frames_v2,
1237 .update_entry = gnttab_update_entry_v2,
1238 .end_foreign_access_ref = gnttab_end_foreign_access_ref_v2,
1239 .end_foreign_transfer_ref = gnttab_end_foreign_transfer_ref_v2,
1240 .query_foreign_access = gnttab_query_foreign_access_v2,
6666754b 1241 .update_subpage_entry = gnttab_update_subpage_entry_v2,
9438ce9d 1242 .update_trans_entry = gnttab_update_trans_entry_v2,
85ff6acb
AL
1243};
1244
0f9f5a95
AL
1245static void gnttab_request_version(void)
1246{
85ff6acb
AL
1247 int rc;
1248 struct gnttab_set_version gsv;
1249
11c7ff17
KRW
1250 gsv.version = 1;
1251
85ff6acb 1252 rc = HYPERVISOR_grant_table_op(GNTTABOP_set_version, &gsv, 1);
69e8f430 1253 if (rc == 0 && gsv.version == 2) {
85ff6acb 1254 grant_table_version = 2;
d0b4d64a 1255 grefs_per_grant_frame = PAGE_SIZE / sizeof(union grant_entry_v2);
85ff6acb
AL
1256 gnttab_interface = &gnttab_v2_ops;
1257 } else if (grant_table_version == 2) {
1258 /*
1259 * If we've already used version 2 features,
1260 * but then suddenly discover that they're not
1261 * available (e.g. migrating to an older
1262 * version of Xen), almost unbounded badness
1263 * can happen.
1264 */
1265 panic("we need grant tables version 2, but only version 1 is available");
1266 } else {
1267 grant_table_version = 1;
d0b4d64a 1268 grefs_per_grant_frame = PAGE_SIZE / sizeof(struct grant_entry_v1);
85ff6acb
AL
1269 gnttab_interface = &gnttab_v1_ops;
1270 }
283c0972 1271 pr_info("Grant tables using version %d layout\n", grant_table_version);
ad9a8612
JF
1272}
1273
d0b4d64a 1274static int gnttab_setup(void)
ad9a8612 1275{
183d03cc
SS
1276 unsigned int max_nr_gframes;
1277
1278 max_nr_gframes = gnttab_max_grant_frames();
1279 if (max_nr_gframes < nr_grant_frames)
ad9a8612 1280 return -ENOSYS;
183d03cc 1281
45684753 1282 if (xen_feature(XENFEAT_auto_translated_physmap) && gnttab_shared.addr == NULL) {
efaf30a3 1283 gnttab_shared.addr = xen_auto_xlat_grant_frames.vaddr;
0f9f5a95 1284 if (gnttab_shared.addr == NULL) {
efaf30a3
KRW
1285 pr_warn("gnttab share frames (addr=0x%08lx) is not mapped!\n",
1286 (unsigned long)xen_auto_xlat_grant_frames.vaddr);
183d03cc
SS
1287 return -ENOMEM;
1288 }
1289 }
45684753 1290 return gnttab_map(0, nr_grant_frames - 1);
ad9a8612
JF
1291}
1292
d0b4d64a
MW
1293int gnttab_resume(void)
1294{
1295 gnttab_request_version();
1296 return gnttab_setup();
1297}
1298
0e91398f 1299int gnttab_suspend(void)
ad9a8612 1300{
0f9f5a95 1301 gnttab_interface->unmap_frames();
ad9a8612
JF
1302 return 0;
1303}
1304
1305static int gnttab_expand(unsigned int req_entries)
1306{
1307 int rc;
1308 unsigned int cur, extra;
1309
d0b4d64a 1310 BUG_ON(grefs_per_grant_frame == 0);
ad9a8612 1311 cur = nr_grant_frames;
d0b4d64a
MW
1312 extra = ((req_entries + (grefs_per_grant_frame-1)) /
1313 grefs_per_grant_frame);
183d03cc 1314 if (cur + extra > gnttab_max_grant_frames())
ad9a8612
JF
1315 return -ENOSPC;
1316
1317 rc = gnttab_map(cur, cur + extra - 1);
1318 if (rc == 0)
1319 rc = grow_gnttab_list(extra);
1320
1321 return rc;
1322}
1323
183d03cc 1324int gnttab_init(void)
ad9a8612
JF
1325{
1326 int i;
bbc60c18 1327 unsigned int max_nr_glist_frames, nr_glist_frames;
ad9a8612 1328 unsigned int nr_init_grefs;
6b5e7d9e 1329 int ret;
ad9a8612 1330
d0b4d64a 1331 gnttab_request_version();
ad9a8612 1332 nr_grant_frames = 1;
ad9a8612
JF
1333
1334 /* Determine the maximum number of frames required for the
1335 * grant reference free list on the current hypervisor.
1336 */
d0b4d64a 1337 BUG_ON(grefs_per_grant_frame == 0);
7f256020 1338 max_nr_glist_frames = (gnttab_max_grant_frames() *
d0b4d64a 1339 grefs_per_grant_frame / RPP);
ad9a8612
JF
1340
1341 gnttab_list = kmalloc(max_nr_glist_frames * sizeof(grant_ref_t *),
1342 GFP_KERNEL);
1343 if (gnttab_list == NULL)
1344 return -ENOMEM;
1345
d0b4d64a 1346 nr_glist_frames = (nr_grant_frames * grefs_per_grant_frame + RPP - 1) / RPP;
bbc60c18 1347 for (i = 0; i < nr_glist_frames; i++) {
ad9a8612 1348 gnttab_list[i] = (grant_ref_t *)__get_free_page(GFP_KERNEL);
6b5e7d9e
JL
1349 if (gnttab_list[i] == NULL) {
1350 ret = -ENOMEM;
ad9a8612 1351 goto ini_nomem;
6b5e7d9e 1352 }
ad9a8612
JF
1353 }
1354
d0b4d64a 1355 if (gnttab_setup() < 0) {
6b5e7d9e
JL
1356 ret = -ENODEV;
1357 goto ini_nomem;
1358 }
ad9a8612 1359
d0b4d64a 1360 nr_init_grefs = nr_grant_frames * grefs_per_grant_frame;
ad9a8612
JF
1361
1362 for (i = NR_RESERVED_ENTRIES; i < nr_init_grefs - 1; i++)
1363 gnttab_entry(i) = i + 1;
1364
1365 gnttab_entry(nr_init_grefs - 1) = GNTTAB_LIST_END;
1366 gnttab_free_count = nr_init_grefs - NR_RESERVED_ENTRIES;
1367 gnttab_free_head = NR_RESERVED_ENTRIES;
1368
1369 printk("Grant table initialized\n");
1370 return 0;
1371
1372 ini_nomem:
1373 for (i--; i >= 0; i--)
1374 free_page((unsigned long)gnttab_list[i]);
1375 kfree(gnttab_list);
6b5e7d9e 1376 return ret;
ad9a8612 1377}
183d03cc
SS
1378EXPORT_SYMBOL_GPL(gnttab_init);
1379
345a5255 1380static int __gnttab_init(void)
183d03cc
SS
1381{
1382 /* Delay grant-table initialization in the PV on HVM case */
1383 if (xen_hvm_domain())
1384 return 0;
1385
1386 if (!xen_pv_domain())
1387 return -ENODEV;
1388
1389 return gnttab_init();
1390}
6926f6d6
KRW
1391/* Starts after core_initcall so that xen_pvh_gnttab_setup can be called
1392 * beforehand to initialize xen_auto_xlat_grant_frames. */
1393core_initcall_sync(__gnttab_init);