]>
Commit | Line | Data |
---|---|---|
54738c09 DG |
1 | /* |
2 | * This program is free software; you can redistribute it and/or modify | |
3 | * it under the terms of the GNU General Public License, version 2, as | |
4 | * published by the Free Software Foundation. | |
5 | * | |
6 | * This program is distributed in the hope that it will be useful, | |
7 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
8 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
9 | * GNU General Public License for more details. | |
10 | * | |
11 | * You should have received a copy of the GNU General Public License | |
12 | * along with this program; if not, write to the Free Software | |
13 | * Foundation, 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. | |
14 | * | |
15 | * Copyright 2010 Paul Mackerras, IBM Corp. <paulus@au1.ibm.com> | |
16 | * Copyright 2011 David Gibson, IBM Corporation <dwg@au1.ibm.com> | |
d3695aa4 | 17 | * Copyright 2016 Alexey Kardashevskiy, IBM Corporation <aik@au1.ibm.com> |
54738c09 DG |
18 | */ |
19 | ||
20 | #include <linux/types.h> | |
21 | #include <linux/string.h> | |
22 | #include <linux/kvm.h> | |
23 | #include <linux/kvm_host.h> | |
24 | #include <linux/highmem.h> | |
25 | #include <linux/gfp.h> | |
26 | #include <linux/slab.h> | |
27 | #include <linux/hugetlb.h> | |
28 | #include <linux/list.h> | |
29 | ||
30 | #include <asm/tlbflush.h> | |
31 | #include <asm/kvm_ppc.h> | |
32 | #include <asm/kvm_book3s.h> | |
f64e8084 | 33 | #include <asm/book3s/64/mmu-hash.h> |
d3695aa4 | 34 | #include <asm/mmu_context.h> |
54738c09 DG |
35 | #include <asm/hvcall.h> |
36 | #include <asm/synch.h> | |
37 | #include <asm/ppc-opcode.h> | |
38 | #include <asm/kvm_host.h> | |
39 | #include <asm/udbg.h> | |
fcbb2ce6 | 40 | #include <asm/iommu.h> |
5ee7af18 | 41 | #include <asm/tce.h> |
54738c09 DG |
42 | |
/* Number of u64 TCE entries that fit in one page of PAGE_SIZE bytes. */
43 | #define TCES_PER_PAGE (PAGE_SIZE / sizeof(u64)) | |
44 | ||
fcbb2ce6 AK |
45 | /* |
46 | * Finds a TCE table descriptor by LIOBN. | |
47 | * | |
48 | * WARNING: This will be called in real or virtual mode on HV KVM and virtual | |
49 | * mode on PR KVM | |
50 | */ | |
69e0373c | 51 | struct kvmppc_spapr_tce_table *kvmppc_find_table(struct kvm *kvm, |
fcbb2ce6 AK |
52 | unsigned long liobn) |
53 | { | |
fcbb2ce6 AK |
54 | struct kvmppc_spapr_tce_table *stt; |
55 | ||
366baf28 | 56 | list_for_each_entry_lockless(stt, &kvm->arch.spapr_tce_tables, list) |
fcbb2ce6 AK |
57 | if (stt->liobn == liobn) |
58 | return stt; | |
59 | ||
60 | return NULL; | |
61 | } | |
d3695aa4 | 62 | EXPORT_SYMBOL_GPL(kvmppc_find_table); |
fcbb2ce6 AK |
63 | |
64 | /* | |
65 | * Validates IO address. | |
66 | * | |
67 | * WARNING: This will be called in real-mode on HV KVM and virtual | |
68 | * mode on PR KVM | |
69 | */ | |
5ee7af18 | 70 | long kvmppc_ioba_validate(struct kvmppc_spapr_tce_table *stt, |
fcbb2ce6 AK |
71 | unsigned long ioba, unsigned long npages) |
72 | { | |
fe26e527 AK |
73 | unsigned long mask = (1ULL << stt->page_shift) - 1; |
74 | unsigned long idx = ioba >> stt->page_shift; | |
fcbb2ce6 | 75 | |
14f853f1 AK |
76 | if ((ioba & mask) || (idx < stt->offset) || |
77 | (idx - stt->offset + npages > stt->size) || | |
78 | (idx + npages < idx)) | |
fcbb2ce6 AK |
79 | return H_PARAMETER; |
80 | ||
81 | return H_SUCCESS; | |
82 | } | |
5ee7af18 AK |
83 | EXPORT_SYMBOL_GPL(kvmppc_ioba_validate); |
84 | ||
85 | /* | |
86 | * Validates TCE address. | |
87 | * At the moment flags and page mask are validated. | |
88 | * As the host kernel does not access those addresses (just puts them | |
89 | * to the table and user space is supposed to process them), we can skip | |
90 | * checking other things (such as TCE is a guest RAM address or the page | |
91 | * was actually allocated). | |
92 | * | |
93 | * WARNING: This will be called in real-mode on HV KVM and virtual | |
94 | * mode on PR KVM | |
95 | */ | |
96 | long kvmppc_tce_validate(struct kvmppc_spapr_tce_table *stt, unsigned long tce) | |
97 | { | |
fe26e527 AK |
98 | unsigned long page_mask = ~((1ULL << stt->page_shift) - 1); |
99 | unsigned long mask = ~(page_mask | TCE_PCI_WRITE | TCE_PCI_READ); | |
5ee7af18 AK |
100 | |
101 | if (tce & mask) | |
102 | return H_PARAMETER; | |
103 | ||
104 | return H_SUCCESS; | |
105 | } | |
106 | EXPORT_SYMBOL_GPL(kvmppc_tce_validate); | |
107 | ||
108 | /* Note on the use of page_address() in real mode, | |
109 | * | |
110 | * It is safe to use page_address() in real mode on ppc64 because | |
111 | * page_address() is always defined as lowmem_page_address() | |
112 | * which returns __va(PFN_PHYS(page_to_pfn(page))) which is arithmetic | |
113 | * operation and does not access page struct. | |
114 | * | |
115 | * Theoretically page_address() could be defined different | |
116 | * but either WANT_PAGE_VIRTUAL or HASHED_PAGE_VIRTUAL | |
117 | * would have to be enabled. | |
118 | * WANT_PAGE_VIRTUAL is never enabled on ppc32/ppc64, | |
119 | * HASHED_PAGE_VIRTUAL could be enabled for ppc32 only and only | |
120 | * if CONFIG_HIGHMEM is defined. As CONFIG_SPARSEMEM_VMEMMAP | |
121 | * is not expected to be enabled on ppc32, page_address() | |
122 | * is safe for ppc32 as well. | |
123 | * | |
124 | * WARNING: This will be called in real-mode on HV KVM and virtual | |
125 | * mode on PR KVM | |
126 | */ | |
127 | static u64 *kvmppc_page_address(struct page *page) | |
128 | { | |
129 | #if defined(HASHED_PAGE_VIRTUAL) || defined(WANT_PAGE_VIRTUAL) | |
130 | #error TODO: fix to avoid page_address() here | |
131 | #endif | |
132 | return (u64 *) page_address(page); | |
133 | } | |
134 | ||
135 | /* | |
136 | * Handles TCE requests for emulated devices. | |
137 | * Puts guest TCE values to the table and expects user space to convert them. | |
138 | * Called in both real and virtual modes. | |
139 | * Cannot fail so kvmppc_tce_validate must be called before it. | |
140 | * | |
141 | * WARNING: This will be called in real-mode on HV KVM and virtual | |
142 | * mode on PR KVM | |
143 | */ | |
144 | void kvmppc_tce_put(struct kvmppc_spapr_tce_table *stt, | |
145 | unsigned long idx, unsigned long tce) | |
146 | { | |
147 | struct page *page; | |
148 | u64 *tbl; | |
149 | ||
14f853f1 | 150 | idx -= stt->offset; |
5ee7af18 AK |
151 | page = stt->pages[idx / TCES_PER_PAGE]; |
152 | tbl = kvmppc_page_address(page); | |
153 | ||
154 | tbl[idx % TCES_PER_PAGE] = tce; | |
155 | } | |
156 | EXPORT_SYMBOL_GPL(kvmppc_tce_put); | |
fcbb2ce6 | 157 | |
d3695aa4 AK |
158 | long kvmppc_gpa_to_ua(struct kvm *kvm, unsigned long gpa, |
159 | unsigned long *ua, unsigned long **prmap) | |
160 | { | |
161 | unsigned long gfn = gpa >> PAGE_SHIFT; | |
162 | struct kvm_memory_slot *memslot; | |
163 | ||
164 | memslot = search_memslots(kvm_memslots(kvm), gfn); | |
165 | if (!memslot) | |
166 | return -EINVAL; | |
167 | ||
168 | *ua = __gfn_to_hva_memslot(memslot, gfn) | | |
169 | (gpa & ~(PAGE_MASK | TCE_PCI_READ | TCE_PCI_WRITE)); | |
170 | ||
171 | #ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE | |
172 | if (prmap) | |
173 | *prmap = &memslot->arch.rmap[gfn - memslot->base_gfn]; | |
174 | #endif | |
175 | ||
176 | return 0; | |
177 | } | |
178 | EXPORT_SYMBOL_GPL(kvmppc_gpa_to_ua); | |
179 | ||
180 | #ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE | |
31217db7 AK |
181 | long kvmppc_rm_h_put_tce(struct kvm_vcpu *vcpu, unsigned long liobn, |
182 | unsigned long ioba, unsigned long tce) | |
54738c09 | 183 | { |
69e0373c | 184 | struct kvmppc_spapr_tce_table *stt; |
fcbb2ce6 | 185 | long ret; |
54738c09 DG |
186 | |
187 | /* udbg_printf("H_PUT_TCE(): liobn=0x%lx ioba=0x%lx, tce=0x%lx\n", */ | |
188 | /* liobn, ioba, tce); */ | |
189 | ||
69e0373c | 190 | stt = kvmppc_find_table(vcpu->kvm, liobn); |
fcbb2ce6 AK |
191 | if (!stt) |
192 | return H_TOO_HARD; | |
193 | ||
194 | ret = kvmppc_ioba_validate(stt, ioba, 1); | |
195 | if (ret != H_SUCCESS) | |
196 | return ret; | |
197 | ||
5ee7af18 AK |
198 | ret = kvmppc_tce_validate(stt, tce); |
199 | if (ret != H_SUCCESS) | |
200 | return ret; | |
fcbb2ce6 | 201 | |
fe26e527 | 202 | kvmppc_tce_put(stt, ioba >> stt->page_shift, tce); |
fcbb2ce6 AK |
203 | |
204 | return H_SUCCESS; | |
54738c09 | 205 | } |
69e9fbb2 | 206 | |
d3695aa4 AK |
207 | static long kvmppc_rm_ua_to_hpa(struct kvm_vcpu *vcpu, |
208 | unsigned long ua, unsigned long *phpa) | |
209 | { | |
210 | pte_t *ptep, pte; | |
211 | unsigned shift = 0; | |
212 | ||
213 | ptep = __find_linux_pte_or_hugepte(vcpu->arch.pgdir, ua, NULL, &shift); | |
214 | if (!ptep || !pte_present(*ptep)) | |
215 | return -ENXIO; | |
216 | pte = *ptep; | |
217 | ||
218 | if (!shift) | |
219 | shift = PAGE_SHIFT; | |
220 | ||
221 | /* Avoid handling anything potentially complicated in realmode */ | |
222 | if (shift > PAGE_SHIFT) | |
223 | return -EAGAIN; | |
224 | ||
225 | if (!pte_young(pte)) | |
226 | return -EAGAIN; | |
227 | ||
228 | *phpa = (pte_pfn(pte) << PAGE_SHIFT) | (ua & ((1ULL << shift) - 1)) | | |
229 | (ua & ~PAGE_MASK); | |
230 | ||
231 | return 0; | |
232 | } | |
233 | ||
234 | long kvmppc_rm_h_put_tce_indirect(struct kvm_vcpu *vcpu, | |
235 | unsigned long liobn, unsigned long ioba, | |
236 | unsigned long tce_list, unsigned long npages) | |
237 | { | |
238 | struct kvmppc_spapr_tce_table *stt; | |
239 | long i, ret = H_SUCCESS; | |
240 | unsigned long tces, entry, ua = 0; | |
241 | unsigned long *rmap = NULL; | |
242 | ||
69e0373c | 243 | stt = kvmppc_find_table(vcpu->kvm, liobn); |
d3695aa4 AK |
244 | if (!stt) |
245 | return H_TOO_HARD; | |
246 | ||
fe26e527 | 247 | entry = ioba >> stt->page_shift; |
d3695aa4 AK |
248 | /* |
249 | * The spec says that the maximum size of the list is 512 TCEs | |
250 | * so the whole table addressed resides in 4K page | |
251 | */ | |
252 | if (npages > 512) | |
253 | return H_PARAMETER; | |
254 | ||
255 | if (tce_list & (SZ_4K - 1)) | |
256 | return H_PARAMETER; | |
257 | ||
258 | ret = kvmppc_ioba_validate(stt, ioba, npages); | |
259 | if (ret != H_SUCCESS) | |
260 | return ret; | |
261 | ||
262 | if (kvmppc_gpa_to_ua(vcpu->kvm, tce_list, &ua, &rmap)) | |
263 | return H_TOO_HARD; | |
264 | ||
265 | rmap = (void *) vmalloc_to_phys(rmap); | |
266 | ||
267 | /* | |
268 | * Synchronize with the MMU notifier callbacks in | |
269 | * book3s_64_mmu_hv.c (kvm_unmap_hva_hv etc.). | |
270 | * While we have the rmap lock, code running on other CPUs | |
271 | * cannot finish unmapping the host real page that backs | |
272 | * this guest real page, so we are OK to access the host | |
273 | * real page. | |
274 | */ | |
275 | lock_rmap(rmap); | |
276 | if (kvmppc_rm_ua_to_hpa(vcpu, ua, &tces)) { | |
277 | ret = H_TOO_HARD; | |
278 | goto unlock_exit; | |
279 | } | |
280 | ||
281 | for (i = 0; i < npages; ++i) { | |
282 | unsigned long tce = be64_to_cpu(((u64 *)tces)[i]); | |
283 | ||
284 | ret = kvmppc_tce_validate(stt, tce); | |
285 | if (ret != H_SUCCESS) | |
286 | goto unlock_exit; | |
287 | ||
288 | kvmppc_tce_put(stt, entry + i, tce); | |
289 | } | |
290 | ||
291 | unlock_exit: | |
292 | unlock_rmap(rmap); | |
293 | ||
294 | return ret; | |
295 | } | |
296 | ||
31217db7 | 297 | long kvmppc_rm_h_stuff_tce(struct kvm_vcpu *vcpu, |
d3695aa4 AK |
298 | unsigned long liobn, unsigned long ioba, |
299 | unsigned long tce_value, unsigned long npages) | |
300 | { | |
301 | struct kvmppc_spapr_tce_table *stt; | |
302 | long i, ret; | |
303 | ||
69e0373c | 304 | stt = kvmppc_find_table(vcpu->kvm, liobn); |
d3695aa4 AK |
305 | if (!stt) |
306 | return H_TOO_HARD; | |
307 | ||
308 | ret = kvmppc_ioba_validate(stt, ioba, npages); | |
309 | if (ret != H_SUCCESS) | |
310 | return ret; | |
311 | ||
312 | /* Check permission bits only to allow userspace poison TCE for debug */ | |
313 | if (tce_value & (TCE_PCI_WRITE | TCE_PCI_READ)) | |
314 | return H_PARAMETER; | |
315 | ||
fe26e527 AK |
316 | for (i = 0; i < npages; ++i, ioba += (1ULL << stt->page_shift)) |
317 | kvmppc_tce_put(stt, ioba >> stt->page_shift, tce_value); | |
d3695aa4 AK |
318 | |
319 | return H_SUCCESS; | |
320 | } | |
d3695aa4 | 321 | |
69e9fbb2 LD |
322 | long kvmppc_h_get_tce(struct kvm_vcpu *vcpu, unsigned long liobn, |
323 | unsigned long ioba) | |
324 | { | |
69e0373c | 325 | struct kvmppc_spapr_tce_table *stt; |
fcbb2ce6 AK |
326 | long ret; |
327 | unsigned long idx; | |
328 | struct page *page; | |
329 | u64 *tbl; | |
69e9fbb2 | 330 | |
69e0373c | 331 | stt = kvmppc_find_table(vcpu->kvm, liobn); |
fcbb2ce6 AK |
332 | if (!stt) |
333 | return H_TOO_HARD; | |
69e9fbb2 | 334 | |
fcbb2ce6 AK |
335 | ret = kvmppc_ioba_validate(stt, ioba, 1); |
336 | if (ret != H_SUCCESS) | |
337 | return ret; | |
69e9fbb2 | 338 | |
14f853f1 | 339 | idx = (ioba >> stt->page_shift) - stt->offset; |
fcbb2ce6 AK |
340 | page = stt->pages[idx / TCES_PER_PAGE]; |
341 | tbl = (u64 *)page_address(page); | |
69e9fbb2 | 342 | |
fcbb2ce6 | 343 | vcpu->arch.gpr[4] = tbl[idx % TCES_PER_PAGE]; |
69e9fbb2 | 344 | |
fcbb2ce6 | 345 | return H_SUCCESS; |
69e9fbb2 LD |
346 | } |
347 | EXPORT_SYMBOL_GPL(kvmppc_h_get_tce); | |
d3695aa4 AK |
348 | |
349 | #endif /* KVM_BOOK3S_HV_POSSIBLE */ |