Commit | Line | Data |
---|---|---|
1da177e4 LT |
1 | /* |
2 | * pSeries_lpar.c | |
3 | * Copyright (C) 2001 Todd Inglett, IBM Corporation | |
4 | * | |
5 | * pSeries LPAR support. | |
6 | * | |
7 | * This program is free software; you can redistribute it and/or modify | |
8 | * it under the terms of the GNU General Public License as published by | |
9 | * the Free Software Foundation; either version 2 of the License, or | |
10 | * (at your option) any later version. | |
11 | * | |
12 | * This program is distributed in the hope that it will be useful, | |
13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
15 | * GNU General Public License for more details. | |
16 | * | |
17 | * You should have received a copy of the GNU General Public License | |
18 | * along with this program; if not, write to the Free Software | |
19 | * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA | |
20 | */ | |
21 | ||
22 | #define DEBUG | |
23 | ||
24 | #include <linux/config.h> | |
25 | #include <linux/kernel.h> | |
26 | #include <linux/dma-mapping.h> | |
27 | #include <asm/processor.h> | |
28 | #include <asm/mmu.h> | |
29 | #include <asm/page.h> | |
30 | #include <asm/pgtable.h> | |
31 | #include <asm/machdep.h> | |
32 | #include <asm/abs_addr.h> | |
33 | #include <asm/mmu_context.h> | |
34 | #include <asm/ppcdebug.h> | |
35 | #include <asm/iommu.h> | |
36 | #include <asm/tlbflush.h> | |
37 | #include <asm/tlb.h> | |
38 | #include <asm/prom.h> | |
39 | #include <asm/abs_addr.h> | |
40 | #include <asm/cputable.h> | |
41 | #include <asm/plpar_wrappers.h> | |
42 | ||
/*
 * DBG() forwards its arguments to udbg_printf() when DEBUG is defined
 * and expands to nothing otherwise.
 */
#ifndef DEBUG
#define DBG(fmt...)
#else
#define DBG(fmt...) udbg_printf(fmt)
#endif

/* in pSeries_hvCall.S */
EXPORT_SYMBOL(plpar_hcall);
EXPORT_SYMBOL(plpar_hcall_4out);
EXPORT_SYMBOL(plpar_hcall_norets);
EXPORT_SYMBOL(plpar_hcall_8arg_2ret);

/* Prototypes for routines that are defined outside this file. */
void fw_feature_init(void);
void pSeries_find_serial_port(void);


/* virtual terminal# for udbg; read by every udbg put/get routine below */
int vtermno;
60 | ||
61 | #define __ALIGNED__ __attribute__((__aligned__(sizeof(long)))) | |
62 | static void udbg_hvsi_putc(unsigned char c) | |
63 | { | |
64 | /* packet's seqno isn't used anyways */ | |
65 | uint8_t packet[] __ALIGNED__ = { 0xff, 5, 0, 0, c }; | |
66 | int rc; | |
67 | ||
68 | if (c == '\n') | |
69 | udbg_hvsi_putc('\r'); | |
70 | ||
71 | do { | |
72 | rc = plpar_put_term_char(vtermno, sizeof(packet), packet); | |
73 | } while (rc == H_Busy); | |
74 | } | |
75 | ||
76 | static long hvsi_udbg_buf_len; | |
77 | static uint8_t hvsi_udbg_buf[256]; | |
78 | ||
79 | static int udbg_hvsi_getc_poll(void) | |
80 | { | |
81 | unsigned char ch; | |
82 | int rc, i; | |
83 | ||
84 | if (hvsi_udbg_buf_len == 0) { | |
85 | rc = plpar_get_term_char(vtermno, &hvsi_udbg_buf_len, hvsi_udbg_buf); | |
86 | if (rc != H_Success || hvsi_udbg_buf[0] != 0xff) { | |
87 | /* bad read or non-data packet */ | |
88 | hvsi_udbg_buf_len = 0; | |
89 | } else { | |
90 | /* remove the packet header */ | |
91 | for (i = 4; i < hvsi_udbg_buf_len; i++) | |
92 | hvsi_udbg_buf[i-4] = hvsi_udbg_buf[i]; | |
93 | hvsi_udbg_buf_len -= 4; | |
94 | } | |
95 | } | |
96 | ||
97 | if (hvsi_udbg_buf_len <= 0 || hvsi_udbg_buf_len > 256) { | |
98 | /* no data ready */ | |
99 | hvsi_udbg_buf_len = 0; | |
100 | return -1; | |
101 | } | |
102 | ||
103 | ch = hvsi_udbg_buf[0]; | |
104 | /* shift remaining data down */ | |
105 | for (i = 1; i < hvsi_udbg_buf_len; i++) { | |
106 | hvsi_udbg_buf[i-1] = hvsi_udbg_buf[i]; | |
107 | } | |
108 | hvsi_udbg_buf_len--; | |
109 | ||
110 | return ch; | |
111 | } | |
112 | ||
/*
 * Blocking read of one character from the HVSI virtual terminal.
 *
 * Polls udbg_hvsi_getc_poll() until it returns something other than -1,
 * spinning through a fixed-count delay loop between attempts.
 */
static unsigned char udbg_hvsi_getc(void)
{
	int c;

	while ((c = udbg_hvsi_getc_poll()) == -1) {
		/* This shouldn't be needed...but... */
		volatile unsigned long spin;

		for (spin = 0; spin < 2000000; spin++)
			;
	}

	return c;
}
128 | ||
129 | static void udbg_putcLP(unsigned char c) | |
130 | { | |
131 | char buf[16]; | |
132 | unsigned long rc; | |
133 | ||
134 | if (c == '\n') | |
135 | udbg_putcLP('\r'); | |
136 | ||
137 | buf[0] = c; | |
138 | do { | |
139 | rc = plpar_put_term_char(vtermno, 1, buf); | |
140 | } while(rc == H_Busy); | |
141 | } | |
142 | ||
143 | /* Buffered chars getc */ | |
144 | static long inbuflen; | |
145 | static long inbuf[2]; /* must be 2 longs */ | |
146 | ||
147 | static int udbg_getc_pollLP(void) | |
148 | { | |
149 | /* The interface is tricky because it may return up to 16 chars. | |
150 | * We save them statically for future calls to udbg_getc(). | |
151 | */ | |
152 | char ch, *buf = (char *)inbuf; | |
153 | int i; | |
154 | long rc; | |
155 | if (inbuflen == 0) { | |
156 | /* get some more chars. */ | |
157 | inbuflen = 0; | |
158 | rc = plpar_get_term_char(vtermno, &inbuflen, buf); | |
159 | if (rc != H_Success) | |
160 | inbuflen = 0; /* otherwise inbuflen is garbage */ | |
161 | } | |
162 | if (inbuflen <= 0 || inbuflen > 16) { | |
163 | /* Catch error case as well as other oddities (corruption) */ | |
164 | inbuflen = 0; | |
165 | return -1; | |
166 | } | |
167 | ch = buf[0]; | |
168 | for (i = 1; i < inbuflen; i++) /* shuffle them down. */ | |
169 | buf[i-1] = buf[i]; | |
170 | inbuflen--; | |
171 | return ch; | |
172 | } | |
173 | ||
/*
 * Blocking read of one character from the raw virtual terminal.
 *
 * Polls udbg_getc_pollLP() until it returns something other than -1,
 * spinning through a fixed-count delay loop between attempts.
 */
static unsigned char udbg_getcLP(void)
{
	int c;

	while ((c = udbg_getc_pollLP()) == -1) {
		/* This shouldn't be needed...but... */
		volatile unsigned long spin;

		for (spin = 0; spin < 2000000; spin++)
			;
	}

	return c;
}
189 | ||
190 | /* call this from early_init() for a working debug console on | |
191 | * vterm capable LPAR machines | |
192 | */ | |
193 | void udbg_init_debug_lpar(void) | |
194 | { | |
195 | vtermno = 0; | |
196 | ppc_md.udbg_putc = udbg_putcLP; | |
197 | ppc_md.udbg_getc = udbg_getcLP; | |
198 | ppc_md.udbg_getc_poll = udbg_getc_pollLP; | |
199 | } | |
200 | ||
201 | /* returns 0 if couldn't find or use /chosen/stdout as console */ | |
202 | int find_udbg_vterm(void) | |
203 | { | |
204 | struct device_node *stdout_node; | |
205 | u32 *termno; | |
206 | char *name; | |
207 | int found = 0; | |
208 | ||
209 | /* find the boot console from /chosen/stdout */ | |
210 | if (!of_chosen) | |
211 | return 0; | |
212 | name = (char *)get_property(of_chosen, "linux,stdout-path", NULL); | |
213 | if (name == NULL) | |
214 | return 0; | |
215 | stdout_node = of_find_node_by_path(name); | |
216 | if (!stdout_node) | |
217 | return 0; | |
218 | ||
219 | /* now we have the stdout node; figure out what type of device it is. */ | |
220 | name = (char *)get_property(stdout_node, "name", NULL); | |
221 | if (!name) { | |
222 | printk(KERN_WARNING "stdout node missing 'name' property!\n"); | |
223 | goto out; | |
224 | } | |
225 | ||
226 | if (strncmp(name, "vty", 3) == 0) { | |
227 | if (device_is_compatible(stdout_node, "hvterm1")) { | |
228 | termno = (u32 *)get_property(stdout_node, "reg", NULL); | |
229 | if (termno) { | |
230 | vtermno = termno[0]; | |
231 | ppc_md.udbg_putc = udbg_putcLP; | |
232 | ppc_md.udbg_getc = udbg_getcLP; | |
233 | ppc_md.udbg_getc_poll = udbg_getc_pollLP; | |
234 | found = 1; | |
235 | } | |
236 | } else if (device_is_compatible(stdout_node, "hvterm-protocol")) { | |
237 | termno = (u32 *)get_property(stdout_node, "reg", NULL); | |
238 | if (termno) { | |
239 | vtermno = termno[0]; | |
240 | ppc_md.udbg_putc = udbg_hvsi_putc; | |
241 | ppc_md.udbg_getc = udbg_hvsi_getc; | |
242 | ppc_md.udbg_getc_poll = udbg_hvsi_getc_poll; | |
243 | found = 1; | |
244 | } | |
245 | } | |
246 | } else if (strncmp(name, "serial", 6)) { | |
247 | /* XXX fix ISA serial console */ | |
248 | printk(KERN_WARNING "serial stdout on LPAR ('%s')! " | |
249 | "can't print udbg messages\n", | |
250 | stdout_node->full_name); | |
251 | } else { | |
252 | printk(KERN_WARNING "don't know how to print to stdout '%s'\n", | |
253 | stdout_node->full_name); | |
254 | } | |
255 | ||
256 | out: | |
257 | of_node_put(stdout_node); | |
258 | return found; | |
259 | } | |
260 | ||
261 | void vpa_init(int cpu) | |
262 | { | |
263 | int hwcpu = get_hard_smp_processor_id(cpu); | |
264 | unsigned long vpa = (unsigned long)&(paca[cpu].lppaca); | |
265 | long ret; | |
266 | unsigned long flags; | |
267 | ||
268 | /* Register the Virtual Processor Area (VPA) */ | |
269 | flags = 1UL << (63 - 18); | |
270 | ret = register_vpa(flags, hwcpu, __pa(vpa)); | |
271 | ||
272 | if (ret) | |
273 | printk(KERN_ERR "WARNING: vpa_init: VPA registration for " | |
274 | "cpu %d (hw %d) of area %lx returns %ld\n", | |
275 | cpu, hwcpu, __pa(vpa), ret); | |
276 | } | |
277 | ||
278 | long pSeries_lpar_hpte_insert(unsigned long hpte_group, | |
279 | unsigned long va, unsigned long prpn, | |
96e28449 | 280 | unsigned long vflags, unsigned long rflags) |
1da177e4 LT |
281 | { |
282 | unsigned long arpn = physRpn_to_absRpn(prpn); | |
283 | unsigned long lpar_rc; | |
284 | unsigned long flags; | |
285 | unsigned long slot; | |
96e28449 | 286 | unsigned long hpte_v, hpte_r; |
1da177e4 LT |
287 | unsigned long dummy0, dummy1; |
288 | ||
96e28449 DG |
289 | hpte_v = ((va >> 23) << HPTE_V_AVPN_SHIFT) | vflags | HPTE_V_VALID; |
290 | if (vflags & HPTE_V_LARGE) | |
291 | hpte_v &= ~(1UL << HPTE_V_AVPN_SHIFT); | |
1da177e4 | 292 | |
96e28449 | 293 | hpte_r = (arpn << HPTE_R_RPN_SHIFT) | rflags; |
1da177e4 LT |
294 | |
295 | /* Now fill in the actual HPTE */ | |
296 | /* Set CEC cookie to 0 */ | |
297 | /* Zero page = 0 */ | |
298 | /* I-cache Invalidate = 0 */ | |
299 | /* I-cache synchronize = 0 */ | |
300 | /* Exact = 0 */ | |
301 | flags = 0; | |
302 | ||
303 | /* XXX why is this here? - Anton */ | |
96e28449 DG |
304 | if (rflags & (_PAGE_GUARDED|_PAGE_NO_CACHE)) |
305 | hpte_r &= ~_PAGE_COHERENT; | |
1da177e4 | 306 | |
96e28449 DG |
307 | lpar_rc = plpar_hcall(H_ENTER, flags, hpte_group, hpte_v, |
308 | hpte_r, &slot, &dummy0, &dummy1); | |
1da177e4 LT |
309 | |
310 | if (unlikely(lpar_rc == H_PTEG_Full)) | |
311 | return -1; | |
312 | ||
313 | /* | |
314 | * Since we try and ioremap PHBs we don't own, the pte insert | |
315 | * will fail. However we must catch the failure in hash_page | |
316 | * or we will loop forever, so return -2 in this case. | |
317 | */ | |
318 | if (unlikely(lpar_rc != H_Success)) | |
319 | return -2; | |
320 | ||
321 | /* Because of iSeries, we have to pass down the secondary | |
322 | * bucket bit here as well | |
323 | */ | |
96e28449 | 324 | return (slot & 7) | (!!(vflags & HPTE_V_SECONDARY) << 3); |
1da177e4 LT |
325 | } |
326 | ||
327 | static DEFINE_SPINLOCK(pSeries_lpar_tlbie_lock); | |
328 | ||
329 | static long pSeries_lpar_hpte_remove(unsigned long hpte_group) | |
330 | { | |
331 | unsigned long slot_offset; | |
332 | unsigned long lpar_rc; | |
333 | int i; | |
334 | unsigned long dummy1, dummy2; | |
335 | ||
336 | /* pick a random slot to start at */ | |
337 | slot_offset = mftb() & 0x7; | |
338 | ||
339 | for (i = 0; i < HPTES_PER_GROUP; i++) { | |
340 | ||
341 | /* don't remove a bolted entry */ | |
342 | lpar_rc = plpar_pte_remove(H_ANDCOND, hpte_group + slot_offset, | |
343 | (0x1UL << 4), &dummy1, &dummy2); | |
344 | ||
345 | if (lpar_rc == H_Success) | |
346 | return i; | |
347 | ||
348 | BUG_ON(lpar_rc != H_Not_Found); | |
349 | ||
350 | slot_offset++; | |
351 | slot_offset &= 0x7; | |
352 | } | |
353 | ||
354 | return -1; | |
355 | } | |
356 | ||
357 | static void pSeries_lpar_hptab_clear(void) | |
358 | { | |
359 | unsigned long size_bytes = 1UL << ppc64_pft_size; | |
360 | unsigned long hpte_count = size_bytes >> 4; | |
361 | unsigned long dummy1, dummy2; | |
362 | int i; | |
363 | ||
364 | /* TODO: Use bulk call */ | |
365 | for (i = 0; i < hpte_count; i++) | |
366 | plpar_pte_remove(0, i, 0, &dummy1, &dummy2); | |
367 | } | |
368 | ||
369 | /* | |
370 | * NOTE: for updatepp ops we are fortunate that the linux "newpp" bits and | |
371 | * the low 3 bits of flags happen to line up. So no transform is needed. | |
372 | * We can probably optimize here and assume the high bits of newpp are | |
373 | * already zero. For now I am paranoid. | |
374 | */ | |
375 | static long pSeries_lpar_hpte_updatepp(unsigned long slot, unsigned long newpp, | |
376 | unsigned long va, int large, int local) | |
377 | { | |
378 | unsigned long lpar_rc; | |
379 | unsigned long flags = (newpp & 7) | H_AVPN; | |
380 | unsigned long avpn = va >> 23; | |
381 | ||
382 | if (large) | |
383 | avpn &= ~0x1UL; | |
384 | ||
385 | lpar_rc = plpar_pte_protect(flags, slot, (avpn << 7)); | |
386 | ||
387 | if (lpar_rc == H_Not_Found) | |
388 | return -1; | |
389 | ||
390 | BUG_ON(lpar_rc != H_Success); | |
391 | ||
392 | return 0; | |
393 | } | |
394 | ||
395 | static unsigned long pSeries_lpar_hpte_getword0(unsigned long slot) | |
396 | { | |
397 | unsigned long dword0; | |
398 | unsigned long lpar_rc; | |
399 | unsigned long dummy_word1; | |
400 | unsigned long flags; | |
401 | ||
402 | /* Read 1 pte at a time */ | |
403 | /* Do not need RPN to logical page translation */ | |
404 | /* No cross CEC PFT access */ | |
405 | flags = 0; | |
406 | ||
407 | lpar_rc = plpar_pte_read(flags, slot, &dword0, &dummy_word1); | |
408 | ||
409 | BUG_ON(lpar_rc != H_Success); | |
410 | ||
411 | return dword0; | |
412 | } | |
413 | ||
414 | static long pSeries_lpar_hpte_find(unsigned long vpn) | |
415 | { | |
416 | unsigned long hash; | |
417 | unsigned long i, j; | |
418 | long slot; | |
96e28449 | 419 | unsigned long hpte_v; |
1da177e4 LT |
420 | |
421 | hash = hpt_hash(vpn, 0); | |
422 | ||
423 | for (j = 0; j < 2; j++) { | |
424 | slot = (hash & htab_hash_mask) * HPTES_PER_GROUP; | |
425 | for (i = 0; i < HPTES_PER_GROUP; i++) { | |
96e28449 | 426 | hpte_v = pSeries_lpar_hpte_getword0(slot); |
1da177e4 | 427 | |
96e28449 DG |
428 | if ((HPTE_V_AVPN_VAL(hpte_v) == (vpn >> 11)) |
429 | && (hpte_v & HPTE_V_VALID) | |
430 | && (!!(hpte_v & HPTE_V_SECONDARY) == j)) { | |
1da177e4 LT |
431 | /* HPTE matches */ |
432 | if (j) | |
433 | slot = -slot; | |
434 | return slot; | |
435 | } | |
436 | ++slot; | |
437 | } | |
438 | hash = ~hash; | |
439 | } | |
440 | ||
441 | return -1; | |
442 | } | |
443 | ||
444 | static void pSeries_lpar_hpte_updateboltedpp(unsigned long newpp, | |
445 | unsigned long ea) | |
446 | { | |
447 | unsigned long lpar_rc; | |
448 | unsigned long vsid, va, vpn, flags; | |
449 | long slot; | |
450 | ||
451 | vsid = get_kernel_vsid(ea); | |
452 | va = (vsid << 28) | (ea & 0x0fffffff); | |
453 | vpn = va >> PAGE_SHIFT; | |
454 | ||
455 | slot = pSeries_lpar_hpte_find(vpn); | |
456 | BUG_ON(slot == -1); | |
457 | ||
458 | flags = newpp & 7; | |
459 | lpar_rc = plpar_pte_protect(flags, slot, 0); | |
460 | ||
461 | BUG_ON(lpar_rc != H_Success); | |
462 | } | |
463 | ||
464 | static void pSeries_lpar_hpte_invalidate(unsigned long slot, unsigned long va, | |
465 | int large, int local) | |
466 | { | |
467 | unsigned long avpn = va >> 23; | |
468 | unsigned long lpar_rc; | |
469 | unsigned long dummy1, dummy2; | |
470 | ||
471 | if (large) | |
472 | avpn &= ~0x1UL; | |
473 | ||
474 | lpar_rc = plpar_pte_remove(H_AVPN, slot, (avpn << 7), &dummy1, | |
475 | &dummy2); | |
476 | ||
477 | if (lpar_rc == H_Not_Found) | |
478 | return; | |
479 | ||
480 | BUG_ON(lpar_rc != H_Success); | |
481 | } | |
482 | ||
483 | /* | |
484 | * Take a spinlock around flushes to avoid bouncing the hypervisor tlbie | |
485 | * lock. | |
486 | */ | |
487 | void pSeries_lpar_flush_hash_range(unsigned long context, unsigned long number, | |
488 | int local) | |
489 | { | |
490 | int i; | |
491 | unsigned long flags = 0; | |
492 | struct ppc64_tlb_batch *batch = &__get_cpu_var(ppc64_tlb_batch); | |
493 | int lock_tlbie = !cpu_has_feature(CPU_FTR_LOCKLESS_TLBIE); | |
494 | ||
495 | if (lock_tlbie) | |
496 | spin_lock_irqsave(&pSeries_lpar_tlbie_lock, flags); | |
497 | ||
498 | for (i = 0; i < number; i++) | |
499 | flush_hash_page(context, batch->addr[i], batch->pte[i], local); | |
500 | ||
501 | if (lock_tlbie) | |
502 | spin_unlock_irqrestore(&pSeries_lpar_tlbie_lock, flags); | |
503 | } | |
504 | ||
505 | void hpte_init_lpar(void) | |
506 | { | |
507 | ppc_md.hpte_invalidate = pSeries_lpar_hpte_invalidate; | |
508 | ppc_md.hpte_updatepp = pSeries_lpar_hpte_updatepp; | |
509 | ppc_md.hpte_updateboltedpp = pSeries_lpar_hpte_updateboltedpp; | |
510 | ppc_md.hpte_insert = pSeries_lpar_hpte_insert; | |
511 | ppc_md.hpte_remove = pSeries_lpar_hpte_remove; | |
512 | ppc_md.flush_hash_range = pSeries_lpar_flush_hash_range; | |
513 | ppc_md.hpte_clear_all = pSeries_lpar_hptab_clear; | |
514 | ||
515 | htab_finish_init(); | |
516 | } |