blob: 7a57ea49172d503f962b4b8c85bbaac73447788f [file] [log] [blame]
Paul Mackerrasa8606e22011-06-29 00:22:05 +00001/*
2 * This program is free software; you can redistribute it and/or modify
3 * it under the terms of the GNU General Public License, version 2, as
4 * published by the Free Software Foundation.
5 *
6 * Copyright 2010-2011 Paul Mackerras, IBM Corp. <paulus@au1.ibm.com>
7 */
8
9#include <linux/types.h>
10#include <linux/string.h>
11#include <linux/kvm.h>
12#include <linux/kvm_host.h>
13#include <linux/hugetlb.h>
Paul Mackerrasc77162d2011-12-12 12:31:00 +000014#include <linux/module.h>
Paul Mackerrasa8606e22011-06-29 00:22:05 +000015
16#include <asm/tlbflush.h>
17#include <asm/kvm_ppc.h>
18#include <asm/kvm_book3s.h>
19#include <asm/mmu-hash64.h>
20#include <asm/hvcall.h>
21#include <asm/synch.h>
22#include <asm/ppc-opcode.h>
23
Paul Mackerras8936dda2011-12-12 12:27:39 +000024/* Translate address of a vmalloc'd thing to a linear map address */
25static void *real_vmalloc_addr(void *x)
26{
27 unsigned long addr = (unsigned long) x;
28 pte_t *p;
29
30 p = find_linux_pte(swapper_pg_dir, addr);
31 if (!p || !pte_present(*p))
32 return NULL;
33 /* assume we don't have huge pages in vmalloc space... */
34 addr = (pte_pfn(*p) << PAGE_SHIFT) | (addr & ~PAGE_MASK);
35 return __va(addr);
36}
Paul Mackerrasa8606e22011-06-29 00:22:05 +000037
Paul Mackerras06ce2c62011-12-12 12:33:07 +000038/*
39 * Add this HPTE into the chain for the real page.
40 * Must be called with the chain locked; it unlocks the chain.
41 */
Paul Mackerras342d3db2011-12-12 12:38:05 +000042void kvmppc_add_revmap_chain(struct kvm *kvm, struct revmap_entry *rev,
Paul Mackerras06ce2c62011-12-12 12:33:07 +000043 unsigned long *rmap, long pte_index, int realmode)
44{
45 struct revmap_entry *head, *tail;
46 unsigned long i;
47
48 if (*rmap & KVMPPC_RMAP_PRESENT) {
49 i = *rmap & KVMPPC_RMAP_INDEX;
50 head = &kvm->arch.revmap[i];
51 if (realmode)
52 head = real_vmalloc_addr(head);
53 tail = &kvm->arch.revmap[head->back];
54 if (realmode)
55 tail = real_vmalloc_addr(tail);
56 rev->forw = i;
57 rev->back = head->back;
58 tail->forw = pte_index;
59 head->back = pte_index;
60 } else {
61 rev->forw = rev->back = pte_index;
Paul Mackerras4879f242012-11-19 23:01:34 +000062 *rmap = (*rmap & ~KVMPPC_RMAP_INDEX) |
63 pte_index | KVMPPC_RMAP_PRESENT;
Paul Mackerras06ce2c62011-12-12 12:33:07 +000064 }
Paul Mackerras4879f242012-11-19 23:01:34 +000065 unlock_rmap(rmap);
Paul Mackerras06ce2c62011-12-12 12:33:07 +000066}
Paul Mackerras342d3db2011-12-12 12:38:05 +000067EXPORT_SYMBOL_GPL(kvmppc_add_revmap_chain);
Paul Mackerras06ce2c62011-12-12 12:33:07 +000068
Paul Mackerras44e5f6b2012-11-19 22:52:49 +000069/*
70 * Note modification of an HPTE; set the HPTE modified bit
71 * if anyone is interested.
72 */
73static inline void note_hpte_modification(struct kvm *kvm,
74 struct revmap_entry *rev)
75{
76 if (atomic_read(&kvm->arch.hpte_mod_interest))
77 rev->guest_rpte |= HPTE_GR_MODIFIED;
78}
79
Paul Mackerras06ce2c62011-12-12 12:33:07 +000080/* Remove this HPTE from the chain for a real page */
81static void remove_revmap_chain(struct kvm *kvm, long pte_index,
Paul Mackerrasbad3b502011-12-15 02:02:02 +000082 struct revmap_entry *rev,
83 unsigned long hpte_v, unsigned long hpte_r)
Paul Mackerras06ce2c62011-12-12 12:33:07 +000084{
Paul Mackerrasbad3b502011-12-15 02:02:02 +000085 struct revmap_entry *next, *prev;
Paul Mackerras06ce2c62011-12-12 12:33:07 +000086 unsigned long gfn, ptel, head;
87 struct kvm_memory_slot *memslot;
88 unsigned long *rmap;
Paul Mackerrasbad3b502011-12-15 02:02:02 +000089 unsigned long rcbits;
Paul Mackerras06ce2c62011-12-12 12:33:07 +000090
Paul Mackerrasbad3b502011-12-15 02:02:02 +000091 rcbits = hpte_r & (HPTE_R_R | HPTE_R_C);
92 ptel = rev->guest_rpte |= rcbits;
Paul Mackerras06ce2c62011-12-12 12:33:07 +000093 gfn = hpte_rpn(ptel, hpte_page_size(hpte_v, ptel));
Paul Mackerras9d4cba72012-01-12 20:09:51 +000094 memslot = __gfn_to_memslot(kvm_memslots(kvm), gfn);
Paul Mackerrasdfe49db2012-09-11 13:28:18 +000095 if (!memslot)
Paul Mackerras06ce2c62011-12-12 12:33:07 +000096 return;
97
Takuya Yoshikawad89cc612012-08-01 18:03:28 +090098 rmap = real_vmalloc_addr(&memslot->arch.rmap[gfn - memslot->base_gfn]);
Paul Mackerras06ce2c62011-12-12 12:33:07 +000099 lock_rmap(rmap);
100
101 head = *rmap & KVMPPC_RMAP_INDEX;
102 next = real_vmalloc_addr(&kvm->arch.revmap[rev->forw]);
103 prev = real_vmalloc_addr(&kvm->arch.revmap[rev->back]);
104 next->back = rev->back;
105 prev->forw = rev->forw;
106 if (head == pte_index) {
107 head = rev->forw;
108 if (head == pte_index)
109 *rmap &= ~(KVMPPC_RMAP_PRESENT | KVMPPC_RMAP_INDEX);
110 else
111 *rmap = (*rmap & ~KVMPPC_RMAP_INDEX) | head;
112 }
Paul Mackerrasbad3b502011-12-15 02:02:02 +0000113 *rmap |= rcbits << KVMPPC_RMAP_RC_SHIFT;
Paul Mackerras06ce2c62011-12-12 12:33:07 +0000114 unlock_rmap(rmap);
115}
116
Paul Mackerras7ed661b2012-11-13 18:31:32 +0000117static pte_t lookup_linux_pte(pgd_t *pgdir, unsigned long hva,
Paul Mackerras4cf302b2011-12-12 12:38:51 +0000118 int writing, unsigned long *pte_sizep)
Paul Mackerras342d3db2011-12-12 12:38:05 +0000119{
120 pte_t *ptep;
121 unsigned long ps = *pte_sizep;
122 unsigned int shift;
123
Paul Mackerras7ed661b2012-11-13 18:31:32 +0000124 ptep = find_linux_pte_or_hugepte(pgdir, hva, &shift);
Paul Mackerras342d3db2011-12-12 12:38:05 +0000125 if (!ptep)
126 return __pte(0);
127 if (shift)
128 *pte_sizep = 1ul << shift;
129 else
130 *pte_sizep = PAGE_SIZE;
131 if (ps > *pte_sizep)
132 return __pte(0);
133 if (!pte_present(*ptep))
134 return __pte(0);
Paul Mackerras4cf302b2011-12-12 12:38:51 +0000135 return kvmppc_read_update_linux_pte(ptep, writing);
Paul Mackerras342d3db2011-12-12 12:38:05 +0000136}
137
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000138static inline void unlock_hpte(unsigned long *hpte, unsigned long hpte_v)
139{
140 asm volatile(PPC_RELEASE_BARRIER "" : : : "memory");
141 hpte[0] = hpte_v;
142}
143
Paul Mackerras7ed661b2012-11-13 18:31:32 +0000144long kvmppc_do_h_enter(struct kvm *kvm, unsigned long flags,
145 long pte_index, unsigned long pteh, unsigned long ptel,
146 pgd_t *pgdir, bool realmode, unsigned long *pte_idx_ret)
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000147{
Paul Mackerrasc77162d2011-12-12 12:31:00 +0000148 unsigned long i, pa, gpa, gfn, psize;
Paul Mackerras342d3db2011-12-12 12:38:05 +0000149 unsigned long slot_fn, hva;
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000150 unsigned long *hpte;
Paul Mackerras8936dda2011-12-12 12:27:39 +0000151 struct revmap_entry *rev;
Paul Mackerras44e5f6b2012-11-19 22:52:49 +0000152 unsigned long g_ptel;
Paul Mackerrasb2b2f162011-12-12 12:28:21 +0000153 struct kvm_memory_slot *memslot;
Paul Mackerrasc77162d2011-12-12 12:31:00 +0000154 unsigned long *physp, pte_size;
Paul Mackerras9d0ef5ea2011-12-12 12:32:27 +0000155 unsigned long is_io;
Paul Mackerras06ce2c62011-12-12 12:33:07 +0000156 unsigned long *rmap;
Paul Mackerras342d3db2011-12-12 12:38:05 +0000157 pte_t pte;
Paul Mackerras4cf302b2011-12-12 12:38:51 +0000158 unsigned int writing;
Paul Mackerras342d3db2011-12-12 12:38:05 +0000159 unsigned long mmu_seq;
Paul Mackerrasbad3b502011-12-15 02:02:02 +0000160 unsigned long rcbits;
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000161
Paul Mackerrasc77162d2011-12-12 12:31:00 +0000162 psize = hpte_page_size(pteh, ptel);
163 if (!psize)
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000164 return H_PARAMETER;
Paul Mackerras4cf302b2011-12-12 12:38:51 +0000165 writing = hpte_is_writable(ptel);
Paul Mackerras697d3892011-12-12 12:36:37 +0000166 pteh &= ~(HPTE_V_HVLOCK | HPTE_V_ABSENT | HPTE_V_VALID);
Paul Mackerras44e5f6b2012-11-19 22:52:49 +0000167 ptel &= ~HPTE_GR_RESERVED;
168 g_ptel = ptel;
Paul Mackerrasb2b2f162011-12-12 12:28:21 +0000169
Paul Mackerras342d3db2011-12-12 12:38:05 +0000170 /* used later to detect if we might have been invalidated */
171 mmu_seq = kvm->mmu_notifier_seq;
172 smp_rmb();
173
Paul Mackerrasc77162d2011-12-12 12:31:00 +0000174 /* Find the memslot (if any) for this address */
175 gpa = (ptel & HPTE_R_RPN) & ~(psize - 1);
176 gfn = gpa >> PAGE_SHIFT;
Paul Mackerras9d4cba72012-01-12 20:09:51 +0000177 memslot = __gfn_to_memslot(kvm_memslots(kvm), gfn);
Paul Mackerras697d3892011-12-12 12:36:37 +0000178 pa = 0;
Paul Mackerras342d3db2011-12-12 12:38:05 +0000179 is_io = ~0ul;
Paul Mackerras697d3892011-12-12 12:36:37 +0000180 rmap = NULL;
181 if (!(memslot && !(memslot->flags & KVM_MEMSLOT_INVALID))) {
182 /* PPC970 can't do emulated MMIO */
183 if (!cpu_has_feature(CPU_FTR_ARCH_206))
184 return H_PARAMETER;
185 /* Emulated MMIO - mark this with key=31 */
186 pteh |= HPTE_V_ABSENT;
187 ptel |= HPTE_R_KEY_HI | HPTE_R_KEY_LO;
188 goto do_insert;
189 }
Paul Mackerrasda9d1d72011-12-12 12:31:41 +0000190
191 /* Check if the requested page fits entirely in the memslot. */
192 if (!slot_is_aligned(memslot, psize))
193 return H_PARAMETER;
Paul Mackerrasc77162d2011-12-12 12:31:00 +0000194 slot_fn = gfn - memslot->base_gfn;
Takuya Yoshikawad89cc612012-08-01 18:03:28 +0900195 rmap = &memslot->arch.rmap[slot_fn];
Paul Mackerrasc77162d2011-12-12 12:31:00 +0000196
Paul Mackerras342d3db2011-12-12 12:38:05 +0000197 if (!kvm->arch.using_mmu_notifiers) {
Paul Mackerrasa66b48c2012-09-11 13:27:46 +0000198 physp = memslot->arch.slot_phys;
Paul Mackerras342d3db2011-12-12 12:38:05 +0000199 if (!physp)
200 return H_PARAMETER;
201 physp += slot_fn;
202 if (realmode)
203 physp = real_vmalloc_addr(physp);
204 pa = *physp;
205 if (!pa)
206 return H_TOO_HARD;
207 is_io = pa & (HPTE_R_I | HPTE_R_W);
208 pte_size = PAGE_SIZE << (pa & KVMPPC_PAGE_ORDER_MASK);
209 pa &= PAGE_MASK;
210 } else {
211 /* Translate to host virtual address */
Gavin Shan66a03502012-08-24 16:50:28 +0800212 hva = __gfn_to_hva_memslot(memslot, gfn);
Paul Mackerrasb2b2f162011-12-12 12:28:21 +0000213
Paul Mackerras342d3db2011-12-12 12:38:05 +0000214 /* Look up the Linux PTE for the backing page */
215 pte_size = psize;
Paul Mackerras7ed661b2012-11-13 18:31:32 +0000216 pte = lookup_linux_pte(pgdir, hva, writing, &pte_size);
Paul Mackerras342d3db2011-12-12 12:38:05 +0000217 if (pte_present(pte)) {
Paul Mackerras4cf302b2011-12-12 12:38:51 +0000218 if (writing && !pte_write(pte))
219 /* make the actual HPTE be read-only */
220 ptel = hpte_make_readonly(ptel);
Paul Mackerras342d3db2011-12-12 12:38:05 +0000221 is_io = hpte_cache_bits(pte_val(pte));
222 pa = pte_pfn(pte) << PAGE_SHIFT;
223 }
224 }
Paul Mackerras7ed661b2012-11-13 18:31:32 +0000225
Paul Mackerrasc77162d2011-12-12 12:31:00 +0000226 if (pte_size < psize)
227 return H_PARAMETER;
228 if (pa && pte_size > psize)
229 pa |= gpa & (pte_size - 1);
230
231 ptel &= ~(HPTE_R_PP0 - psize);
232 ptel |= pa;
Paul Mackerras342d3db2011-12-12 12:38:05 +0000233
234 if (pa)
235 pteh |= HPTE_V_VALID;
236 else
237 pteh |= HPTE_V_ABSENT;
Paul Mackerrasc77162d2011-12-12 12:31:00 +0000238
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000239 /* Check WIMG */
Paul Mackerras342d3db2011-12-12 12:38:05 +0000240 if (is_io != ~0ul && !hpte_cache_flags_ok(ptel, is_io)) {
Paul Mackerras9d0ef5ea2011-12-12 12:32:27 +0000241 if (is_io)
242 return H_PARAMETER;
243 /*
244 * Allow guest to map emulated device memory as
245 * uncacheable, but actually make it cacheable.
246 */
247 ptel &= ~(HPTE_R_W|HPTE_R_I|HPTE_R_G);
248 ptel |= HPTE_R_M;
249 }
Paul Mackerras075295d2011-12-12 12:30:16 +0000250
Paul Mackerras342d3db2011-12-12 12:38:05 +0000251 /* Find and lock the HPTEG slot to use */
Paul Mackerras697d3892011-12-12 12:36:37 +0000252 do_insert:
Paul Mackerras32fad282012-05-04 02:32:53 +0000253 if (pte_index >= kvm->arch.hpt_npte)
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000254 return H_PARAMETER;
255 if (likely((flags & H_EXACT) == 0)) {
256 pte_index &= ~7UL;
257 hpte = (unsigned long *)(kvm->arch.hpt_virt + (pte_index << 4));
Paul Mackerras075295d2011-12-12 12:30:16 +0000258 for (i = 0; i < 8; ++i) {
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000259 if ((*hpte & HPTE_V_VALID) == 0 &&
Paul Mackerras697d3892011-12-12 12:36:37 +0000260 try_lock_hpte(hpte, HPTE_V_HVLOCK | HPTE_V_VALID |
261 HPTE_V_ABSENT))
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000262 break;
263 hpte += 2;
264 }
Paul Mackerras075295d2011-12-12 12:30:16 +0000265 if (i == 8) {
266 /*
267 * Since try_lock_hpte doesn't retry (not even stdcx.
268 * failures), it could be that there is a free slot
269 * but we transiently failed to lock it. Try again,
270 * actually locking each slot and checking it.
271 */
272 hpte -= 16;
273 for (i = 0; i < 8; ++i) {
274 while (!try_lock_hpte(hpte, HPTE_V_HVLOCK))
275 cpu_relax();
Paul Mackerras697d3892011-12-12 12:36:37 +0000276 if (!(*hpte & (HPTE_V_VALID | HPTE_V_ABSENT)))
Paul Mackerras075295d2011-12-12 12:30:16 +0000277 break;
278 *hpte &= ~HPTE_V_HVLOCK;
279 hpte += 2;
280 }
281 if (i == 8)
282 return H_PTEG_FULL;
283 }
Paul Mackerras8936dda2011-12-12 12:27:39 +0000284 pte_index += i;
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000285 } else {
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000286 hpte = (unsigned long *)(kvm->arch.hpt_virt + (pte_index << 4));
Paul Mackerras697d3892011-12-12 12:36:37 +0000287 if (!try_lock_hpte(hpte, HPTE_V_HVLOCK | HPTE_V_VALID |
288 HPTE_V_ABSENT)) {
Paul Mackerras075295d2011-12-12 12:30:16 +0000289 /* Lock the slot and check again */
290 while (!try_lock_hpte(hpte, HPTE_V_HVLOCK))
291 cpu_relax();
Paul Mackerras697d3892011-12-12 12:36:37 +0000292 if (*hpte & (HPTE_V_VALID | HPTE_V_ABSENT)) {
Paul Mackerras075295d2011-12-12 12:30:16 +0000293 *hpte &= ~HPTE_V_HVLOCK;
294 return H_PTEG_FULL;
295 }
296 }
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000297 }
Paul Mackerras8936dda2011-12-12 12:27:39 +0000298
299 /* Save away the guest's idea of the second HPTE dword */
Paul Mackerras06ce2c62011-12-12 12:33:07 +0000300 rev = &kvm->arch.revmap[pte_index];
301 if (realmode)
302 rev = real_vmalloc_addr(rev);
Paul Mackerras44e5f6b2012-11-19 22:52:49 +0000303 if (rev) {
Paul Mackerras8936dda2011-12-12 12:27:39 +0000304 rev->guest_rpte = g_ptel;
Paul Mackerras44e5f6b2012-11-19 22:52:49 +0000305 note_hpte_modification(kvm, rev);
306 }
Paul Mackerras06ce2c62011-12-12 12:33:07 +0000307
308 /* Link HPTE into reverse-map chain */
Paul Mackerras697d3892011-12-12 12:36:37 +0000309 if (pteh & HPTE_V_VALID) {
310 if (realmode)
311 rmap = real_vmalloc_addr(rmap);
312 lock_rmap(rmap);
Paul Mackerras342d3db2011-12-12 12:38:05 +0000313 /* Check for pending invalidations under the rmap chain lock */
314 if (kvm->arch.using_mmu_notifiers &&
Paul Mackerras7ed661b2012-11-13 18:31:32 +0000315 mmu_notifier_retry(kvm, mmu_seq)) {
Paul Mackerras342d3db2011-12-12 12:38:05 +0000316 /* inval in progress, write a non-present HPTE */
317 pteh |= HPTE_V_ABSENT;
318 pteh &= ~HPTE_V_VALID;
319 unlock_rmap(rmap);
320 } else {
321 kvmppc_add_revmap_chain(kvm, rev, rmap, pte_index,
322 realmode);
Paul Mackerrasbad3b502011-12-15 02:02:02 +0000323 /* Only set R/C in real HPTE if already set in *rmap */
324 rcbits = *rmap >> KVMPPC_RMAP_RC_SHIFT;
325 ptel &= rcbits | ~(HPTE_R_R | HPTE_R_C);
Paul Mackerras342d3db2011-12-12 12:38:05 +0000326 }
Paul Mackerras697d3892011-12-12 12:36:37 +0000327 }
Paul Mackerras06ce2c62011-12-12 12:33:07 +0000328
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000329 hpte[1] = ptel;
Paul Mackerras06ce2c62011-12-12 12:33:07 +0000330
331 /* Write the first HPTE dword, unlocking the HPTE and making it valid */
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000332 eieio();
333 hpte[0] = pteh;
334 asm volatile("ptesync" : : : "memory");
Paul Mackerras06ce2c62011-12-12 12:33:07 +0000335
Paul Mackerras7ed661b2012-11-13 18:31:32 +0000336 *pte_idx_ret = pte_index;
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000337 return H_SUCCESS;
338}
Paul Mackerras7ed661b2012-11-13 18:31:32 +0000339EXPORT_SYMBOL_GPL(kvmppc_do_h_enter);
340
341long kvmppc_h_enter(struct kvm_vcpu *vcpu, unsigned long flags,
342 long pte_index, unsigned long pteh, unsigned long ptel)
343{
344 return kvmppc_do_h_enter(vcpu->kvm, flags, pte_index, pteh, ptel,
345 vcpu->arch.pgdir, true, &vcpu->arch.gpr[4]);
346}
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000347
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000348#define LOCK_TOKEN (*(u32 *)(&get_paca()->lock_token))
349
350static inline int try_lock_tlbie(unsigned int *lock)
351{
352 unsigned int tmp, old;
353 unsigned int token = LOCK_TOKEN;
354
355 asm volatile("1:lwarx %1,0,%2\n"
356 " cmpwi cr0,%1,0\n"
357 " bne 2f\n"
358 " stwcx. %3,0,%2\n"
359 " bne- 1b\n"
360 " isync\n"
361 "2:"
362 : "=&r" (tmp), "=&r" (old)
363 : "r" (lock), "r" (token)
364 : "cc", "memory");
365 return old == 0;
366}
367
Paul Mackerras6b445ad2012-11-19 22:55:44 +0000368long kvmppc_do_h_remove(struct kvm *kvm, unsigned long flags,
369 unsigned long pte_index, unsigned long avpn,
370 unsigned long *hpret)
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000371{
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000372 unsigned long *hpte;
373 unsigned long v, r, rb;
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000374 struct revmap_entry *rev;
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000375
Paul Mackerras32fad282012-05-04 02:32:53 +0000376 if (pte_index >= kvm->arch.hpt_npte)
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000377 return H_PARAMETER;
378 hpte = (unsigned long *)(kvm->arch.hpt_virt + (pte_index << 4));
Paul Mackerras075295d2011-12-12 12:30:16 +0000379 while (!try_lock_hpte(hpte, HPTE_V_HVLOCK))
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000380 cpu_relax();
Paul Mackerras697d3892011-12-12 12:36:37 +0000381 if ((hpte[0] & (HPTE_V_ABSENT | HPTE_V_VALID)) == 0 ||
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000382 ((flags & H_AVPN) && (hpte[0] & ~0x7fUL) != avpn) ||
383 ((flags & H_ANDCOND) && (hpte[0] & avpn) != 0)) {
384 hpte[0] &= ~HPTE_V_HVLOCK;
385 return H_NOT_FOUND;
386 }
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000387
388 rev = real_vmalloc_addr(&kvm->arch.revmap[pte_index]);
389 v = hpte[0] & ~HPTE_V_HVLOCK;
390 if (v & HPTE_V_VALID) {
391 hpte[0] &= ~HPTE_V_VALID;
392 rb = compute_tlbie_rb(v, hpte[1], pte_index);
393 if (!(flags & H_LOCAL) && atomic_read(&kvm->online_vcpus) > 1) {
394 while (!try_lock_tlbie(&kvm->arch.tlbie_lock))
395 cpu_relax();
396 asm volatile("ptesync" : : : "memory");
397 asm volatile(PPC_TLBIE(%1,%0)"; eieio; tlbsync"
398 : : "r" (rb), "r" (kvm->arch.lpid));
399 asm volatile("ptesync" : : : "memory");
400 kvm->arch.tlbie_lock = 0;
401 } else {
402 asm volatile("ptesync" : : : "memory");
403 asm volatile("tlbiel %0" : : "r" (rb));
404 asm volatile("ptesync" : : : "memory");
405 }
Paul Mackerrasbad3b502011-12-15 02:02:02 +0000406 /* Read PTE low word after tlbie to get final R/C values */
407 remove_revmap_chain(kvm, pte_index, rev, v, hpte[1]);
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000408 }
Paul Mackerras44e5f6b2012-11-19 22:52:49 +0000409 r = rev->guest_rpte & ~HPTE_GR_RESERVED;
410 note_hpte_modification(kvm, rev);
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000411 unlock_hpte(hpte, 0);
412
Paul Mackerras6b445ad2012-11-19 22:55:44 +0000413 hpret[0] = v;
414 hpret[1] = r;
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000415 return H_SUCCESS;
416}
Paul Mackerras6b445ad2012-11-19 22:55:44 +0000417EXPORT_SYMBOL_GPL(kvmppc_do_h_remove);
418
419long kvmppc_h_remove(struct kvm_vcpu *vcpu, unsigned long flags,
420 unsigned long pte_index, unsigned long avpn)
421{
422 return kvmppc_do_h_remove(vcpu->kvm, flags, pte_index, avpn,
423 &vcpu->arch.gpr[4]);
424}
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000425
426long kvmppc_h_bulk_remove(struct kvm_vcpu *vcpu)
427{
428 struct kvm *kvm = vcpu->kvm;
429 unsigned long *args = &vcpu->arch.gpr[4];
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000430 unsigned long *hp, *hptes[4], tlbrb[4];
431 long int i, j, k, n, found, indexes[4];
432 unsigned long flags, req, pte_index, rcbits;
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000433 long int local = 0;
434 long int ret = H_SUCCESS;
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000435 struct revmap_entry *rev, *revs[4];
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000436
437 if (atomic_read(&kvm->online_vcpus) == 1)
438 local = 1;
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000439 for (i = 0; i < 4 && ret == H_SUCCESS; ) {
440 n = 0;
441 for (; i < 4; ++i) {
442 j = i * 2;
443 pte_index = args[j];
444 flags = pte_index >> 56;
445 pte_index &= ((1ul << 56) - 1);
446 req = flags >> 6;
447 flags &= 3;
448 if (req == 3) { /* no more requests */
449 i = 4;
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000450 break;
451 }
Paul Mackerras32fad282012-05-04 02:32:53 +0000452 if (req != 1 || flags == 3 ||
453 pte_index >= kvm->arch.hpt_npte) {
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000454 /* parameter error */
455 args[j] = ((0xa0 | flags) << 56) + pte_index;
456 ret = H_PARAMETER;
457 break;
458 }
459 hp = (unsigned long *)
460 (kvm->arch.hpt_virt + (pte_index << 4));
461 /* to avoid deadlock, don't spin except for first */
462 if (!try_lock_hpte(hp, HPTE_V_HVLOCK)) {
463 if (n)
464 break;
465 while (!try_lock_hpte(hp, HPTE_V_HVLOCK))
466 cpu_relax();
467 }
468 found = 0;
469 if (hp[0] & (HPTE_V_ABSENT | HPTE_V_VALID)) {
470 switch (flags & 3) {
471 case 0: /* absolute */
472 found = 1;
473 break;
474 case 1: /* andcond */
475 if (!(hp[0] & args[j + 1]))
476 found = 1;
477 break;
478 case 2: /* AVPN */
479 if ((hp[0] & ~0x7fUL) == args[j + 1])
480 found = 1;
481 break;
482 }
483 }
484 if (!found) {
485 hp[0] &= ~HPTE_V_HVLOCK;
486 args[j] = ((0x90 | flags) << 56) + pte_index;
487 continue;
488 }
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000489
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000490 args[j] = ((0x80 | flags) << 56) + pte_index;
491 rev = real_vmalloc_addr(&kvm->arch.revmap[pte_index]);
Paul Mackerras44e5f6b2012-11-19 22:52:49 +0000492 note_hpte_modification(kvm, rev);
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000493
Paul Mackerrasbad3b502011-12-15 02:02:02 +0000494 if (!(hp[0] & HPTE_V_VALID)) {
495 /* insert R and C bits from PTE */
496 rcbits = rev->guest_rpte & (HPTE_R_R|HPTE_R_C);
497 args[j] |= rcbits << (56 - 5);
Paul Mackerras51bfd292012-05-09 23:49:24 +0000498 hp[0] = 0;
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000499 continue;
Paul Mackerrasbad3b502011-12-15 02:02:02 +0000500 }
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000501
502 hp[0] &= ~HPTE_V_VALID; /* leave it locked */
503 tlbrb[n] = compute_tlbie_rb(hp[0], hp[1], pte_index);
504 indexes[n] = j;
505 hptes[n] = hp;
506 revs[n] = rev;
507 ++n;
508 }
509
510 if (!n)
511 break;
512
513 /* Now that we've collected a batch, do the tlbies */
514 if (!local) {
515 while(!try_lock_tlbie(&kvm->arch.tlbie_lock))
516 cpu_relax();
517 asm volatile("ptesync" : : : "memory");
518 for (k = 0; k < n; ++k)
519 asm volatile(PPC_TLBIE(%1,%0) : :
520 "r" (tlbrb[k]),
521 "r" (kvm->arch.lpid));
522 asm volatile("eieio; tlbsync; ptesync" : : : "memory");
523 kvm->arch.tlbie_lock = 0;
524 } else {
525 asm volatile("ptesync" : : : "memory");
526 for (k = 0; k < n; ++k)
527 asm volatile("tlbiel %0" : : "r" (tlbrb[k]));
528 asm volatile("ptesync" : : : "memory");
529 }
530
Paul Mackerrasbad3b502011-12-15 02:02:02 +0000531 /* Read PTE low words after tlbie to get final R/C values */
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000532 for (k = 0; k < n; ++k) {
533 j = indexes[k];
534 pte_index = args[j] & ((1ul << 56) - 1);
535 hp = hptes[k];
536 rev = revs[k];
Paul Mackerrasbad3b502011-12-15 02:02:02 +0000537 remove_revmap_chain(kvm, pte_index, rev, hp[0], hp[1]);
538 rcbits = rev->guest_rpte & (HPTE_R_R|HPTE_R_C);
539 args[j] |= rcbits << (56 - 5);
540 hp[0] = 0;
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000541 }
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000542 }
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000543
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000544 return ret;
545}
546
547long kvmppc_h_protect(struct kvm_vcpu *vcpu, unsigned long flags,
548 unsigned long pte_index, unsigned long avpn,
549 unsigned long va)
550{
551 struct kvm *kvm = vcpu->kvm;
552 unsigned long *hpte;
Paul Mackerras8936dda2011-12-12 12:27:39 +0000553 struct revmap_entry *rev;
554 unsigned long v, r, rb, mask, bits;
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000555
Paul Mackerras32fad282012-05-04 02:32:53 +0000556 if (pte_index >= kvm->arch.hpt_npte)
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000557 return H_PARAMETER;
Paul Mackerras697d3892011-12-12 12:36:37 +0000558
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000559 hpte = (unsigned long *)(kvm->arch.hpt_virt + (pte_index << 4));
Paul Mackerras075295d2011-12-12 12:30:16 +0000560 while (!try_lock_hpte(hpte, HPTE_V_HVLOCK))
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000561 cpu_relax();
Paul Mackerras697d3892011-12-12 12:36:37 +0000562 if ((hpte[0] & (HPTE_V_ABSENT | HPTE_V_VALID)) == 0 ||
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000563 ((flags & H_AVPN) && (hpte[0] & ~0x7fUL) != avpn)) {
564 hpte[0] &= ~HPTE_V_HVLOCK;
565 return H_NOT_FOUND;
566 }
Paul Mackerras697d3892011-12-12 12:36:37 +0000567
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000568 if (atomic_read(&kvm->online_vcpus) == 1)
569 flags |= H_LOCAL;
570 v = hpte[0];
Paul Mackerras8936dda2011-12-12 12:27:39 +0000571 bits = (flags << 55) & HPTE_R_PP0;
572 bits |= (flags << 48) & HPTE_R_KEY_HI;
573 bits |= flags & (HPTE_R_PP | HPTE_R_N | HPTE_R_KEY_LO);
574
575 /* Update guest view of 2nd HPTE dword */
576 mask = HPTE_R_PP0 | HPTE_R_PP | HPTE_R_N |
577 HPTE_R_KEY_HI | HPTE_R_KEY_LO;
578 rev = real_vmalloc_addr(&kvm->arch.revmap[pte_index]);
579 if (rev) {
580 r = (rev->guest_rpte & ~mask) | bits;
581 rev->guest_rpte = r;
Paul Mackerras44e5f6b2012-11-19 22:52:49 +0000582 note_hpte_modification(kvm, rev);
Paul Mackerras8936dda2011-12-12 12:27:39 +0000583 }
584 r = (hpte[1] & ~mask) | bits;
585
586 /* Update HPTE */
Paul Mackerras697d3892011-12-12 12:36:37 +0000587 if (v & HPTE_V_VALID) {
588 rb = compute_tlbie_rb(v, r, pte_index);
589 hpte[0] = v & ~HPTE_V_VALID;
590 if (!(flags & H_LOCAL)) {
591 while(!try_lock_tlbie(&kvm->arch.tlbie_lock))
592 cpu_relax();
593 asm volatile("ptesync" : : : "memory");
594 asm volatile(PPC_TLBIE(%1,%0)"; eieio; tlbsync"
595 : : "r" (rb), "r" (kvm->arch.lpid));
596 asm volatile("ptesync" : : : "memory");
597 kvm->arch.tlbie_lock = 0;
598 } else {
599 asm volatile("ptesync" : : : "memory");
600 asm volatile("tlbiel %0" : : "r" (rb));
601 asm volatile("ptesync" : : : "memory");
602 }
Paul Mackerras1cc8ed02012-11-21 23:28:41 +0000603 /*
604 * If the host has this page as readonly but the guest
605 * wants to make it read/write, reduce the permissions.
606 * Checking the host permissions involves finding the
607 * memslot and then the Linux PTE for the page.
608 */
609 if (hpte_is_writable(r) && kvm->arch.using_mmu_notifiers) {
610 unsigned long psize, gfn, hva;
611 struct kvm_memory_slot *memslot;
612 pgd_t *pgdir = vcpu->arch.pgdir;
613 pte_t pte;
614
615 psize = hpte_page_size(v, r);
616 gfn = ((r & HPTE_R_RPN) & ~(psize - 1)) >> PAGE_SHIFT;
617 memslot = __gfn_to_memslot(kvm_memslots(kvm), gfn);
618 if (memslot) {
619 hva = __gfn_to_hva_memslot(memslot, gfn);
620 pte = lookup_linux_pte(pgdir, hva, 1, &psize);
621 if (pte_present(pte) && !pte_write(pte))
622 r = hpte_make_readonly(r);
623 }
624 }
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000625 }
626 hpte[1] = r;
627 eieio();
628 hpte[0] = v & ~HPTE_V_HVLOCK;
629 asm volatile("ptesync" : : : "memory");
630 return H_SUCCESS;
631}
632
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000633long kvmppc_h_read(struct kvm_vcpu *vcpu, unsigned long flags,
634 unsigned long pte_index)
635{
636 struct kvm *kvm = vcpu->kvm;
Paul Mackerras697d3892011-12-12 12:36:37 +0000637 unsigned long *hpte, v, r;
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000638 int i, n = 1;
Paul Mackerras8936dda2011-12-12 12:27:39 +0000639 struct revmap_entry *rev = NULL;
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000640
Paul Mackerras32fad282012-05-04 02:32:53 +0000641 if (pte_index >= kvm->arch.hpt_npte)
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000642 return H_PARAMETER;
643 if (flags & H_READ_4) {
644 pte_index &= ~3;
645 n = 4;
646 }
Paul Mackerrasbad3b502011-12-15 02:02:02 +0000647 rev = real_vmalloc_addr(&kvm->arch.revmap[pte_index]);
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000648 for (i = 0; i < n; ++i, ++pte_index) {
649 hpte = (unsigned long *)(kvm->arch.hpt_virt + (pte_index << 4));
Paul Mackerras697d3892011-12-12 12:36:37 +0000650 v = hpte[0] & ~HPTE_V_HVLOCK;
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000651 r = hpte[1];
Paul Mackerras697d3892011-12-12 12:36:37 +0000652 if (v & HPTE_V_ABSENT) {
653 v &= ~HPTE_V_ABSENT;
654 v |= HPTE_V_VALID;
655 }
Paul Mackerras44e5f6b2012-11-19 22:52:49 +0000656 if (v & HPTE_V_VALID) {
Paul Mackerrasbad3b502011-12-15 02:02:02 +0000657 r = rev[i].guest_rpte | (r & (HPTE_R_R | HPTE_R_C));
Paul Mackerras44e5f6b2012-11-19 22:52:49 +0000658 r &= ~HPTE_GR_RESERVED;
659 }
Paul Mackerras697d3892011-12-12 12:36:37 +0000660 vcpu->arch.gpr[4 + i * 2] = v;
Paul Mackerrasa8606e22011-06-29 00:22:05 +0000661 vcpu->arch.gpr[5 + i * 2] = r;
662 }
663 return H_SUCCESS;
664}
Paul Mackerras697d3892011-12-12 12:36:37 +0000665
Paul Mackerras342d3db2011-12-12 12:38:05 +0000666void kvmppc_invalidate_hpte(struct kvm *kvm, unsigned long *hptep,
667 unsigned long pte_index)
668{
669 unsigned long rb;
670
671 hptep[0] &= ~HPTE_V_VALID;
672 rb = compute_tlbie_rb(hptep[0], hptep[1], pte_index);
673 while (!try_lock_tlbie(&kvm->arch.tlbie_lock))
674 cpu_relax();
675 asm volatile("ptesync" : : : "memory");
676 asm volatile(PPC_TLBIE(%1,%0)"; eieio; tlbsync"
677 : : "r" (rb), "r" (kvm->arch.lpid));
678 asm volatile("ptesync" : : : "memory");
679 kvm->arch.tlbie_lock = 0;
680}
681EXPORT_SYMBOL_GPL(kvmppc_invalidate_hpte);
682
Paul Mackerras55514892011-12-15 02:02:47 +0000683void kvmppc_clear_ref_hpte(struct kvm *kvm, unsigned long *hptep,
684 unsigned long pte_index)
685{
686 unsigned long rb;
687 unsigned char rbyte;
688
689 rb = compute_tlbie_rb(hptep[0], hptep[1], pte_index);
690 rbyte = (hptep[1] & ~HPTE_R_R) >> 8;
691 /* modify only the second-last byte, which contains the ref bit */
692 *((char *)hptep + 14) = rbyte;
693 while (!try_lock_tlbie(&kvm->arch.tlbie_lock))
694 cpu_relax();
695 asm volatile(PPC_TLBIE(%1,%0)"; eieio; tlbsync"
696 : : "r" (rb), "r" (kvm->arch.lpid));
697 asm volatile("ptesync" : : : "memory");
698 kvm->arch.tlbie_lock = 0;
699}
700EXPORT_SYMBOL_GPL(kvmppc_clear_ref_hpte);
701
/*
 * Base page shift for large-page segments, indexed by the 2-bit value
 * taken from the SLB_VSID_LP field of the SLB entry.
 */
static int slb_base_page_shift[4] = {
	[0] = 24,	/* 16M */
	[1] = 16,	/* 64k */
	[2] = 34,	/* 16G */
	[3] = 20,	/* 1M, unsupported */
};
708
709long kvmppc_hv_find_lock_hpte(struct kvm *kvm, gva_t eaddr, unsigned long slb_v,
710 unsigned long valid)
711{
712 unsigned int i;
713 unsigned int pshift;
714 unsigned long somask;
715 unsigned long vsid, hash;
716 unsigned long avpn;
717 unsigned long *hpte;
718 unsigned long mask, val;
719 unsigned long v, r;
720
721 /* Get page shift, work out hash and AVPN etc. */
722 mask = SLB_VSID_B | HPTE_V_AVPN | HPTE_V_SECONDARY;
723 val = 0;
724 pshift = 12;
725 if (slb_v & SLB_VSID_L) {
726 mask |= HPTE_V_LARGE;
727 val |= HPTE_V_LARGE;
728 pshift = slb_base_page_shift[(slb_v & SLB_VSID_LP) >> 4];
729 }
730 if (slb_v & SLB_VSID_B_1T) {
731 somask = (1UL << 40) - 1;
732 vsid = (slb_v & ~SLB_VSID_B) >> SLB_VSID_SHIFT_1T;
733 vsid ^= vsid << 25;
734 } else {
735 somask = (1UL << 28) - 1;
736 vsid = (slb_v & ~SLB_VSID_B) >> SLB_VSID_SHIFT;
737 }
Paul Mackerras32fad282012-05-04 02:32:53 +0000738 hash = (vsid ^ ((eaddr & somask) >> pshift)) & kvm->arch.hpt_mask;
Paul Mackerras697d3892011-12-12 12:36:37 +0000739 avpn = slb_v & ~(somask >> 16); /* also includes B */
740 avpn |= (eaddr & somask) >> 16;
741
742 if (pshift >= 24)
743 avpn &= ~((1UL << (pshift - 16)) - 1);
744 else
745 avpn &= ~0x7fUL;
746 val |= avpn;
747
748 for (;;) {
749 hpte = (unsigned long *)(kvm->arch.hpt_virt + (hash << 7));
750
751 for (i = 0; i < 16; i += 2) {
752 /* Read the PTE racily */
753 v = hpte[i] & ~HPTE_V_HVLOCK;
754
755 /* Check valid/absent, hash, segment size and AVPN */
756 if (!(v & valid) || (v & mask) != val)
757 continue;
758
759 /* Lock the PTE and read it under the lock */
760 while (!try_lock_hpte(&hpte[i], HPTE_V_HVLOCK))
761 cpu_relax();
762 v = hpte[i] & ~HPTE_V_HVLOCK;
763 r = hpte[i+1];
764
765 /*
766 * Check the HPTE again, including large page size
767 * Since we don't currently allow any MPSS (mixed
768 * page-size segment) page sizes, it is sufficient
769 * to check against the actual page size.
770 */
771 if ((v & valid) && (v & mask) == val &&
772 hpte_page_size(v, r) == (1ul << pshift))
773 /* Return with the HPTE still locked */
774 return (hash << 3) + (i >> 1);
775
776 /* Unlock and move on */
777 hpte[i] = v;
778 }
779
780 if (val & HPTE_V_SECONDARY)
781 break;
782 val |= HPTE_V_SECONDARY;
Paul Mackerras32fad282012-05-04 02:32:53 +0000783 hash = hash ^ kvm->arch.hpt_mask;
Paul Mackerras697d3892011-12-12 12:36:37 +0000784 }
785 return -1;
786}
787EXPORT_SYMBOL(kvmppc_hv_find_lock_hpte);
788
789/*
790 * Called in real mode to check whether an HPTE not found fault
Paul Mackerras4cf302b2011-12-12 12:38:51 +0000791 * is due to accessing a paged-out page or an emulated MMIO page,
792 * or if a protection fault is due to accessing a page that the
793 * guest wanted read/write access to but which we made read-only.
Paul Mackerras697d3892011-12-12 12:36:37 +0000794 * Returns a possibly modified status (DSISR) value if not
795 * (i.e. pass the interrupt to the guest),
796 * -1 to pass the fault up to host kernel mode code, -2 to do that
Paul Mackerras342d3db2011-12-12 12:38:05 +0000797 * and also load the instruction word (for MMIO emulation),
Paul Mackerras697d3892011-12-12 12:36:37 +0000798 * or 0 if we should make the guest retry the access.
799 */
800long kvmppc_hpte_hv_fault(struct kvm_vcpu *vcpu, unsigned long addr,
Paul Mackerras342d3db2011-12-12 12:38:05 +0000801 unsigned long slb_v, unsigned int status, bool data)
Paul Mackerras697d3892011-12-12 12:36:37 +0000802{
803 struct kvm *kvm = vcpu->kvm;
804 long int index;
805 unsigned long v, r, gr;
806 unsigned long *hpte;
807 unsigned long valid;
808 struct revmap_entry *rev;
809 unsigned long pp, key;
810
Paul Mackerras4cf302b2011-12-12 12:38:51 +0000811 /* For protection fault, expect to find a valid HPTE */
812 valid = HPTE_V_VALID;
813 if (status & DSISR_NOHPTE)
814 valid |= HPTE_V_ABSENT;
Paul Mackerras342d3db2011-12-12 12:38:05 +0000815
Paul Mackerras697d3892011-12-12 12:36:37 +0000816 index = kvmppc_hv_find_lock_hpte(kvm, addr, slb_v, valid);
Paul Mackerras4cf302b2011-12-12 12:38:51 +0000817 if (index < 0) {
818 if (status & DSISR_NOHPTE)
819 return status; /* there really was no HPTE */
820 return 0; /* for prot fault, HPTE disappeared */
821 }
Paul Mackerras697d3892011-12-12 12:36:37 +0000822 hpte = (unsigned long *)(kvm->arch.hpt_virt + (index << 4));
823 v = hpte[0] & ~HPTE_V_HVLOCK;
824 r = hpte[1];
825 rev = real_vmalloc_addr(&kvm->arch.revmap[index]);
826 gr = rev->guest_rpte;
827
Paul Mackerrasa92bce92011-12-15 02:01:10 +0000828 unlock_hpte(hpte, v);
Paul Mackerras697d3892011-12-12 12:36:37 +0000829
Paul Mackerras4cf302b2011-12-12 12:38:51 +0000830 /* For not found, if the HPTE is valid by now, retry the instruction */
831 if ((status & DSISR_NOHPTE) && (v & HPTE_V_VALID))
Paul Mackerras697d3892011-12-12 12:36:37 +0000832 return 0;
833
834 /* Check access permissions to the page */
835 pp = gr & (HPTE_R_PP0 | HPTE_R_PP);
836 key = (vcpu->arch.shregs.msr & MSR_PR) ? SLB_VSID_KP : SLB_VSID_KS;
Paul Mackerras342d3db2011-12-12 12:38:05 +0000837 status &= ~DSISR_NOHPTE; /* DSISR_NOHPTE == SRR1_ISI_NOPT */
838 if (!data) {
839 if (gr & (HPTE_R_N | HPTE_R_G))
840 return status | SRR1_ISI_N_OR_G;
841 if (!hpte_read_permission(pp, slb_v & key))
842 return status | SRR1_ISI_PROT;
843 } else if (status & DSISR_ISSTORE) {
Paul Mackerras697d3892011-12-12 12:36:37 +0000844 /* check write permission */
845 if (!hpte_write_permission(pp, slb_v & key))
Paul Mackerras342d3db2011-12-12 12:38:05 +0000846 return status | DSISR_PROTFAULT;
Paul Mackerras697d3892011-12-12 12:36:37 +0000847 } else {
848 if (!hpte_read_permission(pp, slb_v & key))
Paul Mackerras342d3db2011-12-12 12:38:05 +0000849 return status | DSISR_PROTFAULT;
Paul Mackerras697d3892011-12-12 12:36:37 +0000850 }
851
852 /* Check storage key, if applicable */
Paul Mackerras342d3db2011-12-12 12:38:05 +0000853 if (data && (vcpu->arch.shregs.msr & MSR_DR)) {
Paul Mackerras697d3892011-12-12 12:36:37 +0000854 unsigned int perm = hpte_get_skey_perm(gr, vcpu->arch.amr);
855 if (status & DSISR_ISSTORE)
856 perm >>= 1;
857 if (perm & 1)
Paul Mackerras342d3db2011-12-12 12:38:05 +0000858 return status | DSISR_KEYFAULT;
Paul Mackerras697d3892011-12-12 12:36:37 +0000859 }
860
861 /* Save HPTE info for virtual-mode handler */
862 vcpu->arch.pgfault_addr = addr;
863 vcpu->arch.pgfault_index = index;
864 vcpu->arch.pgfault_hpte[0] = v;
865 vcpu->arch.pgfault_hpte[1] = r;
866
Paul Mackerras342d3db2011-12-12 12:38:05 +0000867 /* Check the storage key to see if it is possibly emulated MMIO */
868 if (data && (vcpu->arch.shregs.msr & MSR_IR) &&
869 (r & (HPTE_R_KEY_HI | HPTE_R_KEY_LO)) ==
870 (HPTE_R_KEY_HI | HPTE_R_KEY_LO))
Paul Mackerras697d3892011-12-12 12:36:37 +0000871 return -2; /* MMIO emulation - load instr word */
872
873 return -1; /* send fault up to host kernel mode */
Paul Mackerras697d3892011-12-12 12:36:37 +0000874}