1 /* SPDX-License-Identifier: GPL-2.0 */
2 #ifndef _ASM_X86_PARAVIRT_H
3 #define _ASM_X86_PARAVIRT_H
4 /* Various instructions on x86 need to be replaced for
5  * para-virtualization: those hooks are defined here. */
6 
7 #ifdef CONFIG_PARAVIRT
8 #include <asm/pgtable_types.h>
9 #include <asm/asm.h>
10 #include <asm/nospec-branch.h>
11 
12 #include <asm/paravirt_types.h>
13 
14 #ifndef __ASSEMBLY__
15 #include <linux/bug.h>
16 #include <linux/types.h>
17 #include <linux/cpumask.h>
18 #include <asm/frame.h>
19 
paravirt_sched_clock(void)20 static inline unsigned long long paravirt_sched_clock(void)
21 {
22 	return PVOP_CALL0(unsigned long long, time.sched_clock);
23 }
24 
25 struct static_key;
26 extern struct static_key paravirt_steal_enabled;
27 extern struct static_key paravirt_steal_rq_enabled;
28 
29 __visible void __native_queued_spin_unlock(struct qspinlock *lock);
30 bool pv_is_native_spin_unlock(void);
31 __visible bool __native_vcpu_is_preempted(long cpu);
32 bool pv_is_native_vcpu_is_preempted(void);
33 
paravirt_steal_clock(int cpu)34 static inline u64 paravirt_steal_clock(int cpu)
35 {
36 	return PVOP_CALL1(u64, time.steal_clock, cpu);
37 }
38 
39 /* The paravirtualized I/O functions */
slow_down_io(void)40 static inline void slow_down_io(void)
41 {
42 	pv_ops.cpu.io_delay();
43 #ifdef REALLY_SLOW_IO
44 	pv_ops.cpu.io_delay();
45 	pv_ops.cpu.io_delay();
46 	pv_ops.cpu.io_delay();
47 #endif
48 }
49 
__flush_tlb(void)50 static inline void __flush_tlb(void)
51 {
52 	PVOP_VCALL0(mmu.flush_tlb_user);
53 }
54 
__flush_tlb_global(void)55 static inline void __flush_tlb_global(void)
56 {
57 	PVOP_VCALL0(mmu.flush_tlb_kernel);
58 }
59 
__flush_tlb_one_user(unsigned long addr)60 static inline void __flush_tlb_one_user(unsigned long addr)
61 {
62 	PVOP_VCALL1(mmu.flush_tlb_one_user, addr);
63 }
64 
flush_tlb_others(const struct cpumask * cpumask,const struct flush_tlb_info * info)65 static inline void flush_tlb_others(const struct cpumask *cpumask,
66 				    const struct flush_tlb_info *info)
67 {
68 	PVOP_VCALL2(mmu.flush_tlb_others, cpumask, info);
69 }
70 
paravirt_tlb_remove_table(struct mmu_gather * tlb,void * table)71 static inline void paravirt_tlb_remove_table(struct mmu_gather *tlb, void *table)
72 {
73 	PVOP_VCALL2(mmu.tlb_remove_table, tlb, table);
74 }
75 
paravirt_arch_exit_mmap(struct mm_struct * mm)76 static inline void paravirt_arch_exit_mmap(struct mm_struct *mm)
77 {
78 	PVOP_VCALL1(mmu.exit_mmap, mm);
79 }
80 
81 #ifdef CONFIG_PARAVIRT_XXL
load_sp0(unsigned long sp0)82 static inline void load_sp0(unsigned long sp0)
83 {
84 	PVOP_VCALL1(cpu.load_sp0, sp0);
85 }
86 
87 /* The paravirtualized CPUID instruction. */
__cpuid(unsigned int * eax,unsigned int * ebx,unsigned int * ecx,unsigned int * edx)88 static inline void __cpuid(unsigned int *eax, unsigned int *ebx,
89 			   unsigned int *ecx, unsigned int *edx)
90 {
91 	PVOP_VCALL4(cpu.cpuid, eax, ebx, ecx, edx);
92 }
93 
94 /*
95  * These special macros can be used to get or set a debugging register
96  */
paravirt_get_debugreg(int reg)97 static inline unsigned long paravirt_get_debugreg(int reg)
98 {
99 	return PVOP_CALL1(unsigned long, cpu.get_debugreg, reg);
100 }
101 #define get_debugreg(var, reg) var = paravirt_get_debugreg(reg)
set_debugreg(unsigned long val,int reg)102 static inline void set_debugreg(unsigned long val, int reg)
103 {
104 	PVOP_VCALL2(cpu.set_debugreg, reg, val);
105 }
106 
read_cr0(void)107 static inline unsigned long read_cr0(void)
108 {
109 	return PVOP_CALL0(unsigned long, cpu.read_cr0);
110 }
111 
write_cr0(unsigned long x)112 static inline void write_cr0(unsigned long x)
113 {
114 	PVOP_VCALL1(cpu.write_cr0, x);
115 }
116 
read_cr2(void)117 static inline unsigned long read_cr2(void)
118 {
119 	return PVOP_CALLEE0(unsigned long, mmu.read_cr2);
120 }
121 
write_cr2(unsigned long x)122 static inline void write_cr2(unsigned long x)
123 {
124 	PVOP_VCALL1(mmu.write_cr2, x);
125 }
126 
__read_cr3(void)127 static inline unsigned long __read_cr3(void)
128 {
129 	return PVOP_CALL0(unsigned long, mmu.read_cr3);
130 }
131 
write_cr3(unsigned long x)132 static inline void write_cr3(unsigned long x)
133 {
134 	PVOP_VCALL1(mmu.write_cr3, x);
135 }
136 
__write_cr4(unsigned long x)137 static inline void __write_cr4(unsigned long x)
138 {
139 	PVOP_VCALL1(cpu.write_cr4, x);
140 }
141 
arch_safe_halt(void)142 static inline void arch_safe_halt(void)
143 {
144 	PVOP_VCALL0(irq.safe_halt);
145 }
146 
halt(void)147 static inline void halt(void)
148 {
149 	PVOP_VCALL0(irq.halt);
150 }
151 
wbinvd(void)152 static inline void wbinvd(void)
153 {
154 	PVOP_VCALL0(cpu.wbinvd);
155 }
156 
157 #define get_kernel_rpl()  (pv_info.kernel_rpl)
158 
paravirt_read_msr(unsigned msr)159 static inline u64 paravirt_read_msr(unsigned msr)
160 {
161 	return PVOP_CALL1(u64, cpu.read_msr, msr);
162 }
163 
paravirt_write_msr(unsigned msr,unsigned low,unsigned high)164 static inline void paravirt_write_msr(unsigned msr,
165 				      unsigned low, unsigned high)
166 {
167 	PVOP_VCALL3(cpu.write_msr, msr, low, high);
168 }
169 
paravirt_read_msr_safe(unsigned msr,int * err)170 static inline u64 paravirt_read_msr_safe(unsigned msr, int *err)
171 {
172 	return PVOP_CALL2(u64, cpu.read_msr_safe, msr, err);
173 }
174 
paravirt_write_msr_safe(unsigned msr,unsigned low,unsigned high)175 static inline int paravirt_write_msr_safe(unsigned msr,
176 					  unsigned low, unsigned high)
177 {
178 	return PVOP_CALL3(int, cpu.write_msr_safe, msr, low, high);
179 }
180 
181 #define rdmsr(msr, val1, val2)			\
182 do {						\
183 	u64 _l = paravirt_read_msr(msr);	\
184 	val1 = (u32)_l;				\
185 	val2 = _l >> 32;			\
186 } while (0)
187 
188 #define wrmsr(msr, val1, val2)			\
189 do {						\
190 	paravirt_write_msr(msr, val1, val2);	\
191 } while (0)
192 
193 #define rdmsrl(msr, val)			\
194 do {						\
195 	val = paravirt_read_msr(msr);		\
196 } while (0)
197 
wrmsrl(unsigned msr,u64 val)198 static inline void wrmsrl(unsigned msr, u64 val)
199 {
200 	wrmsr(msr, (u32)val, (u32)(val>>32));
201 }
202 
203 #define wrmsr_safe(msr, a, b)	paravirt_write_msr_safe(msr, a, b)
204 
205 /* rdmsr with exception handling */
206 #define rdmsr_safe(msr, a, b)				\
207 ({							\
208 	int _err;					\
209 	u64 _l = paravirt_read_msr_safe(msr, &_err);	\
210 	(*a) = (u32)_l;					\
211 	(*b) = _l >> 32;				\
212 	_err;						\
213 })
214 
rdmsrl_safe(unsigned msr,unsigned long long * p)215 static inline int rdmsrl_safe(unsigned msr, unsigned long long *p)
216 {
217 	int err;
218 
219 	*p = paravirt_read_msr_safe(msr, &err);
220 	return err;
221 }
222 
paravirt_read_pmc(int counter)223 static inline unsigned long long paravirt_read_pmc(int counter)
224 {
225 	return PVOP_CALL1(u64, cpu.read_pmc, counter);
226 }
227 
228 #define rdpmc(counter, low, high)		\
229 do {						\
230 	u64 _l = paravirt_read_pmc(counter);	\
231 	low = (u32)_l;				\
232 	high = _l >> 32;			\
233 } while (0)
234 
235 #define rdpmcl(counter, val) ((val) = paravirt_read_pmc(counter))
236 
paravirt_alloc_ldt(struct desc_struct * ldt,unsigned entries)237 static inline void paravirt_alloc_ldt(struct desc_struct *ldt, unsigned entries)
238 {
239 	PVOP_VCALL2(cpu.alloc_ldt, ldt, entries);
240 }
241 
paravirt_free_ldt(struct desc_struct * ldt,unsigned entries)242 static inline void paravirt_free_ldt(struct desc_struct *ldt, unsigned entries)
243 {
244 	PVOP_VCALL2(cpu.free_ldt, ldt, entries);
245 }
246 
load_TR_desc(void)247 static inline void load_TR_desc(void)
248 {
249 	PVOP_VCALL0(cpu.load_tr_desc);
250 }
load_gdt(const struct desc_ptr * dtr)251 static inline void load_gdt(const struct desc_ptr *dtr)
252 {
253 	PVOP_VCALL1(cpu.load_gdt, dtr);
254 }
load_idt(const struct desc_ptr * dtr)255 static inline void load_idt(const struct desc_ptr *dtr)
256 {
257 	PVOP_VCALL1(cpu.load_idt, dtr);
258 }
set_ldt(const void * addr,unsigned entries)259 static inline void set_ldt(const void *addr, unsigned entries)
260 {
261 	PVOP_VCALL2(cpu.set_ldt, addr, entries);
262 }
paravirt_store_tr(void)263 static inline unsigned long paravirt_store_tr(void)
264 {
265 	return PVOP_CALL0(unsigned long, cpu.store_tr);
266 }
267 
268 #define store_tr(tr)	((tr) = paravirt_store_tr())
load_TLS(struct thread_struct * t,unsigned cpu)269 static inline void load_TLS(struct thread_struct *t, unsigned cpu)
270 {
271 	PVOP_VCALL2(cpu.load_tls, t, cpu);
272 }
273 
274 #ifdef CONFIG_X86_64
load_gs_index(unsigned int gs)275 static inline void load_gs_index(unsigned int gs)
276 {
277 	PVOP_VCALL1(cpu.load_gs_index, gs);
278 }
279 #endif
280 
write_ldt_entry(struct desc_struct * dt,int entry,const void * desc)281 static inline void write_ldt_entry(struct desc_struct *dt, int entry,
282 				   const void *desc)
283 {
284 	PVOP_VCALL3(cpu.write_ldt_entry, dt, entry, desc);
285 }
286 
write_gdt_entry(struct desc_struct * dt,int entry,void * desc,int type)287 static inline void write_gdt_entry(struct desc_struct *dt, int entry,
288 				   void *desc, int type)
289 {
290 	PVOP_VCALL4(cpu.write_gdt_entry, dt, entry, desc, type);
291 }
292 
write_idt_entry(gate_desc * dt,int entry,const gate_desc * g)293 static inline void write_idt_entry(gate_desc *dt, int entry, const gate_desc *g)
294 {
295 	PVOP_VCALL3(cpu.write_idt_entry, dt, entry, g);
296 }
set_iopl_mask(unsigned mask)297 static inline void set_iopl_mask(unsigned mask)
298 {
299 	PVOP_VCALL1(cpu.set_iopl_mask, mask);
300 }
301 
paravirt_activate_mm(struct mm_struct * prev,struct mm_struct * next)302 static inline void paravirt_activate_mm(struct mm_struct *prev,
303 					struct mm_struct *next)
304 {
305 	PVOP_VCALL2(mmu.activate_mm, prev, next);
306 }
307 
paravirt_arch_dup_mmap(struct mm_struct * oldmm,struct mm_struct * mm)308 static inline void paravirt_arch_dup_mmap(struct mm_struct *oldmm,
309 					  struct mm_struct *mm)
310 {
311 	PVOP_VCALL2(mmu.dup_mmap, oldmm, mm);
312 }
313 
paravirt_pgd_alloc(struct mm_struct * mm)314 static inline int paravirt_pgd_alloc(struct mm_struct *mm)
315 {
316 	return PVOP_CALL1(int, mmu.pgd_alloc, mm);
317 }
318 
paravirt_pgd_free(struct mm_struct * mm,pgd_t * pgd)319 static inline void paravirt_pgd_free(struct mm_struct *mm, pgd_t *pgd)
320 {
321 	PVOP_VCALL2(mmu.pgd_free, mm, pgd);
322 }
323 
paravirt_alloc_pte(struct mm_struct * mm,unsigned long pfn)324 static inline void paravirt_alloc_pte(struct mm_struct *mm, unsigned long pfn)
325 {
326 	PVOP_VCALL2(mmu.alloc_pte, mm, pfn);
327 }
paravirt_release_pte(unsigned long pfn)328 static inline void paravirt_release_pte(unsigned long pfn)
329 {
330 	PVOP_VCALL1(mmu.release_pte, pfn);
331 }
332 
paravirt_alloc_pmd(struct mm_struct * mm,unsigned long pfn)333 static inline void paravirt_alloc_pmd(struct mm_struct *mm, unsigned long pfn)
334 {
335 	PVOP_VCALL2(mmu.alloc_pmd, mm, pfn);
336 }
337 
paravirt_release_pmd(unsigned long pfn)338 static inline void paravirt_release_pmd(unsigned long pfn)
339 {
340 	PVOP_VCALL1(mmu.release_pmd, pfn);
341 }
342 
paravirt_alloc_pud(struct mm_struct * mm,unsigned long pfn)343 static inline void paravirt_alloc_pud(struct mm_struct *mm, unsigned long pfn)
344 {
345 	PVOP_VCALL2(mmu.alloc_pud, mm, pfn);
346 }
paravirt_release_pud(unsigned long pfn)347 static inline void paravirt_release_pud(unsigned long pfn)
348 {
349 	PVOP_VCALL1(mmu.release_pud, pfn);
350 }
351 
paravirt_alloc_p4d(struct mm_struct * mm,unsigned long pfn)352 static inline void paravirt_alloc_p4d(struct mm_struct *mm, unsigned long pfn)
353 {
354 	PVOP_VCALL2(mmu.alloc_p4d, mm, pfn);
355 }
356 
paravirt_release_p4d(unsigned long pfn)357 static inline void paravirt_release_p4d(unsigned long pfn)
358 {
359 	PVOP_VCALL1(mmu.release_p4d, pfn);
360 }
361 
__pte(pteval_t val)362 static inline pte_t __pte(pteval_t val)
363 {
364 	pteval_t ret;
365 
366 	if (sizeof(pteval_t) > sizeof(long))
367 		ret = PVOP_CALLEE2(pteval_t, mmu.make_pte, val, (u64)val >> 32);
368 	else
369 		ret = PVOP_CALLEE1(pteval_t, mmu.make_pte, val);
370 
371 	return (pte_t) { .pte = ret };
372 }
373 
pte_val(pte_t pte)374 static inline pteval_t pte_val(pte_t pte)
375 {
376 	pteval_t ret;
377 
378 	if (sizeof(pteval_t) > sizeof(long))
379 		ret = PVOP_CALLEE2(pteval_t, mmu.pte_val,
380 				   pte.pte, (u64)pte.pte >> 32);
381 	else
382 		ret = PVOP_CALLEE1(pteval_t, mmu.pte_val, pte.pte);
383 
384 	return ret;
385 }
386 
__pgd(pgdval_t val)387 static inline pgd_t __pgd(pgdval_t val)
388 {
389 	pgdval_t ret;
390 
391 	if (sizeof(pgdval_t) > sizeof(long))
392 		ret = PVOP_CALLEE2(pgdval_t, mmu.make_pgd, val, (u64)val >> 32);
393 	else
394 		ret = PVOP_CALLEE1(pgdval_t, mmu.make_pgd, val);
395 
396 	return (pgd_t) { ret };
397 }
398 
pgd_val(pgd_t pgd)399 static inline pgdval_t pgd_val(pgd_t pgd)
400 {
401 	pgdval_t ret;
402 
403 	if (sizeof(pgdval_t) > sizeof(long))
404 		ret =  PVOP_CALLEE2(pgdval_t, mmu.pgd_val,
405 				    pgd.pgd, (u64)pgd.pgd >> 32);
406 	else
407 		ret =  PVOP_CALLEE1(pgdval_t, mmu.pgd_val, pgd.pgd);
408 
409 	return ret;
410 }
411 
412 #define  __HAVE_ARCH_PTEP_MODIFY_PROT_TRANSACTION
ptep_modify_prot_start(struct vm_area_struct * vma,unsigned long addr,pte_t * ptep)413 static inline pte_t ptep_modify_prot_start(struct vm_area_struct *vma, unsigned long addr,
414 					   pte_t *ptep)
415 {
416 	pteval_t ret;
417 
418 	ret = PVOP_CALL3(pteval_t, mmu.ptep_modify_prot_start, vma, addr, ptep);
419 
420 	return (pte_t) { .pte = ret };
421 }
422 
ptep_modify_prot_commit(struct vm_area_struct * vma,unsigned long addr,pte_t * ptep,pte_t old_pte,pte_t pte)423 static inline void ptep_modify_prot_commit(struct vm_area_struct *vma, unsigned long addr,
424 					   pte_t *ptep, pte_t old_pte, pte_t pte)
425 {
426 
427 	if (sizeof(pteval_t) > sizeof(long))
428 		/* 5 arg words */
429 		pv_ops.mmu.ptep_modify_prot_commit(vma, addr, ptep, pte);
430 	else
431 		PVOP_VCALL4(mmu.ptep_modify_prot_commit,
432 			    vma, addr, ptep, pte.pte);
433 }
434 
set_pte(pte_t * ptep,pte_t pte)435 static inline void set_pte(pte_t *ptep, pte_t pte)
436 {
437 	if (sizeof(pteval_t) > sizeof(long))
438 		PVOP_VCALL3(mmu.set_pte, ptep, pte.pte, (u64)pte.pte >> 32);
439 	else
440 		PVOP_VCALL2(mmu.set_pte, ptep, pte.pte);
441 }
442 
set_pte_at(struct mm_struct * mm,unsigned long addr,pte_t * ptep,pte_t pte)443 static inline void set_pte_at(struct mm_struct *mm, unsigned long addr,
444 			      pte_t *ptep, pte_t pte)
445 {
446 	if (sizeof(pteval_t) > sizeof(long))
447 		/* 5 arg words */
448 		pv_ops.mmu.set_pte_at(mm, addr, ptep, pte);
449 	else
450 		PVOP_VCALL4(mmu.set_pte_at, mm, addr, ptep, pte.pte);
451 }
452 
set_pmd(pmd_t * pmdp,pmd_t pmd)453 static inline void set_pmd(pmd_t *pmdp, pmd_t pmd)
454 {
455 	pmdval_t val = native_pmd_val(pmd);
456 
457 	if (sizeof(pmdval_t) > sizeof(long))
458 		PVOP_VCALL3(mmu.set_pmd, pmdp, val, (u64)val >> 32);
459 	else
460 		PVOP_VCALL2(mmu.set_pmd, pmdp, val);
461 }
462 
463 #if CONFIG_PGTABLE_LEVELS >= 3
__pmd(pmdval_t val)464 static inline pmd_t __pmd(pmdval_t val)
465 {
466 	pmdval_t ret;
467 
468 	if (sizeof(pmdval_t) > sizeof(long))
469 		ret = PVOP_CALLEE2(pmdval_t, mmu.make_pmd, val, (u64)val >> 32);
470 	else
471 		ret = PVOP_CALLEE1(pmdval_t, mmu.make_pmd, val);
472 
473 	return (pmd_t) { ret };
474 }
475 
pmd_val(pmd_t pmd)476 static inline pmdval_t pmd_val(pmd_t pmd)
477 {
478 	pmdval_t ret;
479 
480 	if (sizeof(pmdval_t) > sizeof(long))
481 		ret =  PVOP_CALLEE2(pmdval_t, mmu.pmd_val,
482 				    pmd.pmd, (u64)pmd.pmd >> 32);
483 	else
484 		ret =  PVOP_CALLEE1(pmdval_t, mmu.pmd_val, pmd.pmd);
485 
486 	return ret;
487 }
488 
set_pud(pud_t * pudp,pud_t pud)489 static inline void set_pud(pud_t *pudp, pud_t pud)
490 {
491 	pudval_t val = native_pud_val(pud);
492 
493 	if (sizeof(pudval_t) > sizeof(long))
494 		PVOP_VCALL3(mmu.set_pud, pudp, val, (u64)val >> 32);
495 	else
496 		PVOP_VCALL2(mmu.set_pud, pudp, val);
497 }
498 #if CONFIG_PGTABLE_LEVELS >= 4
__pud(pudval_t val)499 static inline pud_t __pud(pudval_t val)
500 {
501 	pudval_t ret;
502 
503 	ret = PVOP_CALLEE1(pudval_t, mmu.make_pud, val);
504 
505 	return (pud_t) { ret };
506 }
507 
pud_val(pud_t pud)508 static inline pudval_t pud_val(pud_t pud)
509 {
510 	return PVOP_CALLEE1(pudval_t, mmu.pud_val, pud.pud);
511 }
512 
pud_clear(pud_t * pudp)513 static inline void pud_clear(pud_t *pudp)
514 {
515 	set_pud(pudp, __pud(0));
516 }
517 
set_p4d(p4d_t * p4dp,p4d_t p4d)518 static inline void set_p4d(p4d_t *p4dp, p4d_t p4d)
519 {
520 	p4dval_t val = native_p4d_val(p4d);
521 
522 	PVOP_VCALL2(mmu.set_p4d, p4dp, val);
523 }
524 
525 #if CONFIG_PGTABLE_LEVELS >= 5
526 
__p4d(p4dval_t val)527 static inline p4d_t __p4d(p4dval_t val)
528 {
529 	p4dval_t ret = PVOP_CALLEE1(p4dval_t, mmu.make_p4d, val);
530 
531 	return (p4d_t) { ret };
532 }
533 
p4d_val(p4d_t p4d)534 static inline p4dval_t p4d_val(p4d_t p4d)
535 {
536 	return PVOP_CALLEE1(p4dval_t, mmu.p4d_val, p4d.p4d);
537 }
538 
__set_pgd(pgd_t * pgdp,pgd_t pgd)539 static inline void __set_pgd(pgd_t *pgdp, pgd_t pgd)
540 {
541 	PVOP_VCALL2(mmu.set_pgd, pgdp, native_pgd_val(pgd));
542 }
543 
544 #define set_pgd(pgdp, pgdval) do {					\
545 	if (pgtable_l5_enabled())						\
546 		__set_pgd(pgdp, pgdval);				\
547 	else								\
548 		set_p4d((p4d_t *)(pgdp), (p4d_t) { (pgdval).pgd });	\
549 } while (0)
550 
551 #define pgd_clear(pgdp) do {						\
552 	if (pgtable_l5_enabled())						\
553 		set_pgd(pgdp, __pgd(0));				\
554 } while (0)
555 
556 #endif  /* CONFIG_PGTABLE_LEVELS == 5 */
557 
p4d_clear(p4d_t * p4dp)558 static inline void p4d_clear(p4d_t *p4dp)
559 {
560 	set_p4d(p4dp, __p4d(0));
561 }
562 
563 #endif	/* CONFIG_PGTABLE_LEVELS == 4 */
564 
565 #endif	/* CONFIG_PGTABLE_LEVELS >= 3 */
566 
567 #ifdef CONFIG_X86_PAE
568 /* Special-case pte-setting operations for PAE, which can't update a
569    64-bit pte atomically */
set_pte_atomic(pte_t * ptep,pte_t pte)570 static inline void set_pte_atomic(pte_t *ptep, pte_t pte)
571 {
572 	PVOP_VCALL3(mmu.set_pte_atomic, ptep, pte.pte, pte.pte >> 32);
573 }
574 
pte_clear(struct mm_struct * mm,unsigned long addr,pte_t * ptep)575 static inline void pte_clear(struct mm_struct *mm, unsigned long addr,
576 			     pte_t *ptep)
577 {
578 	PVOP_VCALL3(mmu.pte_clear, mm, addr, ptep);
579 }
580 
pmd_clear(pmd_t * pmdp)581 static inline void pmd_clear(pmd_t *pmdp)
582 {
583 	PVOP_VCALL1(mmu.pmd_clear, pmdp);
584 }
585 #else  /* !CONFIG_X86_PAE */
set_pte_atomic(pte_t * ptep,pte_t pte)586 static inline void set_pte_atomic(pte_t *ptep, pte_t pte)
587 {
588 	set_pte(ptep, pte);
589 }
590 
pte_clear(struct mm_struct * mm,unsigned long addr,pte_t * ptep)591 static inline void pte_clear(struct mm_struct *mm, unsigned long addr,
592 			     pte_t *ptep)
593 {
594 	set_pte_at(mm, addr, ptep, __pte(0));
595 }
596 
pmd_clear(pmd_t * pmdp)597 static inline void pmd_clear(pmd_t *pmdp)
598 {
599 	set_pmd(pmdp, __pmd(0));
600 }
601 #endif	/* CONFIG_X86_PAE */
602 
603 #define  __HAVE_ARCH_START_CONTEXT_SWITCH
arch_start_context_switch(struct task_struct * prev)604 static inline void arch_start_context_switch(struct task_struct *prev)
605 {
606 	PVOP_VCALL1(cpu.start_context_switch, prev);
607 }
608 
arch_end_context_switch(struct task_struct * next)609 static inline void arch_end_context_switch(struct task_struct *next)
610 {
611 	PVOP_VCALL1(cpu.end_context_switch, next);
612 }
613 
614 #define  __HAVE_ARCH_ENTER_LAZY_MMU_MODE
arch_enter_lazy_mmu_mode(void)615 static inline void arch_enter_lazy_mmu_mode(void)
616 {
617 	PVOP_VCALL0(mmu.lazy_mode.enter);
618 }
619 
arch_leave_lazy_mmu_mode(void)620 static inline void arch_leave_lazy_mmu_mode(void)
621 {
622 	PVOP_VCALL0(mmu.lazy_mode.leave);
623 }
624 
arch_flush_lazy_mmu_mode(void)625 static inline void arch_flush_lazy_mmu_mode(void)
626 {
627 	PVOP_VCALL0(mmu.lazy_mode.flush);
628 }
629 
__set_fixmap(unsigned idx,phys_addr_t phys,pgprot_t flags)630 static inline void __set_fixmap(unsigned /* enum fixed_addresses */ idx,
631 				phys_addr_t phys, pgprot_t flags)
632 {
633 	pv_ops.mmu.set_fixmap(idx, phys, flags);
634 }
635 #endif
636 
637 #if defined(CONFIG_SMP) && defined(CONFIG_PARAVIRT_SPINLOCKS)
638 
pv_queued_spin_lock_slowpath(struct qspinlock * lock,u32 val)639 static __always_inline void pv_queued_spin_lock_slowpath(struct qspinlock *lock,
640 							u32 val)
641 {
642 	PVOP_VCALL2(lock.queued_spin_lock_slowpath, lock, val);
643 }
644 
pv_queued_spin_unlock(struct qspinlock * lock)645 static __always_inline void pv_queued_spin_unlock(struct qspinlock *lock)
646 {
647 	PVOP_VCALLEE1(lock.queued_spin_unlock, lock);
648 }
649 
pv_wait(u8 * ptr,u8 val)650 static __always_inline void pv_wait(u8 *ptr, u8 val)
651 {
652 	PVOP_VCALL2(lock.wait, ptr, val);
653 }
654 
pv_kick(int cpu)655 static __always_inline void pv_kick(int cpu)
656 {
657 	PVOP_VCALL1(lock.kick, cpu);
658 }
659 
pv_vcpu_is_preempted(long cpu)660 static __always_inline bool pv_vcpu_is_preempted(long cpu)
661 {
662 	return PVOP_CALLEE1(bool, lock.vcpu_is_preempted, cpu);
663 }
664 
665 void __raw_callee_save___native_queued_spin_unlock(struct qspinlock *lock);
666 bool __raw_callee_save___native_vcpu_is_preempted(long cpu);
667 
668 #endif /* SMP && PARAVIRT_SPINLOCKS */
669 
670 #ifdef CONFIG_X86_32
671 #define PV_SAVE_REGS "pushl %ecx; pushl %edx;"
672 #define PV_RESTORE_REGS "popl %edx; popl %ecx;"
673 
674 /* save and restore all caller-save registers, except return value */
675 #define PV_SAVE_ALL_CALLER_REGS		"pushl %ecx;"
676 #define PV_RESTORE_ALL_CALLER_REGS	"popl  %ecx;"
677 
678 #define PV_FLAGS_ARG "0"
679 #define PV_EXTRA_CLOBBERS
680 #define PV_VEXTRA_CLOBBERS
681 #else
682 /* save and restore all caller-save registers, except return value */
683 #define PV_SAVE_ALL_CALLER_REGS						\
684 	"push %rcx;"							\
685 	"push %rdx;"							\
686 	"push %rsi;"							\
687 	"push %rdi;"							\
688 	"push %r8;"							\
689 	"push %r9;"							\
690 	"push %r10;"							\
691 	"push %r11;"
692 #define PV_RESTORE_ALL_CALLER_REGS					\
693 	"pop %r11;"							\
694 	"pop %r10;"							\
695 	"pop %r9;"							\
696 	"pop %r8;"							\
697 	"pop %rdi;"							\
698 	"pop %rsi;"							\
699 	"pop %rdx;"							\
700 	"pop %rcx;"
701 
702 /* We save some registers, but all of them, that's too much. We clobber all
703  * caller saved registers but the argument parameter */
704 #define PV_SAVE_REGS "pushq %%rdi;"
705 #define PV_RESTORE_REGS "popq %%rdi;"
706 #define PV_EXTRA_CLOBBERS EXTRA_CLOBBERS, "rcx" , "rdx", "rsi"
707 #define PV_VEXTRA_CLOBBERS EXTRA_CLOBBERS, "rdi", "rcx" , "rdx", "rsi"
708 #define PV_FLAGS_ARG "D"
709 #endif
710 
711 /*
712  * Generate a thunk around a function which saves all caller-save
713  * registers except for the return value.  This allows C functions to
714  * be called from assembler code where fewer than normal registers are
715  * available.  It may also help code generation around calls from C
716  * code if the common case doesn't use many registers.
717  *
718  * When a callee is wrapped in a thunk, the caller can assume that all
719  * arg regs and all scratch registers are preserved across the
720  * call. The return value in rax/eax will not be saved, even for void
721  * functions.
722  */
723 #define PV_THUNK_NAME(func) "__raw_callee_save_" #func
724 #define PV_CALLEE_SAVE_REGS_THUNK(func)					\
725 	extern typeof(func) __raw_callee_save_##func;			\
726 									\
727 	asm(".pushsection .text;"					\
728 	    ".globl " PV_THUNK_NAME(func) ";"				\
729 	    ".type " PV_THUNK_NAME(func) ", @function;"			\
730 	    PV_THUNK_NAME(func) ":"					\
731 	    FRAME_BEGIN							\
732 	    PV_SAVE_ALL_CALLER_REGS					\
733 	    "call " #func ";"						\
734 	    PV_RESTORE_ALL_CALLER_REGS					\
735 	    FRAME_END							\
736 	    "ret;"							\
737 	    ".size " PV_THUNK_NAME(func) ", .-" PV_THUNK_NAME(func) ";"	\
738 	    ".popsection")
739 
740 /* Get a reference to a callee-save function */
741 #define PV_CALLEE_SAVE(func)						\
742 	((struct paravirt_callee_save) { __raw_callee_save_##func })
743 
744 /* Promise that "func" already uses the right calling convention */
745 #define __PV_IS_CALLEE_SAVE(func)			\
746 	((struct paravirt_callee_save) { func })
747 
748 #ifdef CONFIG_PARAVIRT_XXL
arch_local_save_flags(void)749 static inline notrace unsigned long arch_local_save_flags(void)
750 {
751 	return PVOP_CALLEE0(unsigned long, irq.save_fl);
752 }
753 
arch_local_irq_restore(unsigned long f)754 static inline notrace void arch_local_irq_restore(unsigned long f)
755 {
756 	PVOP_VCALLEE1(irq.restore_fl, f);
757 }
758 
arch_local_irq_disable(void)759 static inline notrace void arch_local_irq_disable(void)
760 {
761 	PVOP_VCALLEE0(irq.irq_disable);
762 }
763 
arch_local_irq_enable(void)764 static inline notrace void arch_local_irq_enable(void)
765 {
766 	PVOP_VCALLEE0(irq.irq_enable);
767 }
768 
arch_local_irq_save(void)769 static inline notrace unsigned long arch_local_irq_save(void)
770 {
771 	unsigned long f;
772 
773 	f = arch_local_save_flags();
774 	arch_local_irq_disable();
775 	return f;
776 }
777 #endif
778 
779 
780 /* Make sure as little as possible of this mess escapes. */
781 #undef PARAVIRT_CALL
782 #undef __PVOP_CALL
783 #undef __PVOP_VCALL
784 #undef PVOP_VCALL0
785 #undef PVOP_CALL0
786 #undef PVOP_VCALL1
787 #undef PVOP_CALL1
788 #undef PVOP_VCALL2
789 #undef PVOP_CALL2
790 #undef PVOP_VCALL3
791 #undef PVOP_CALL3
792 #undef PVOP_VCALL4
793 #undef PVOP_CALL4
794 
795 extern void default_banner(void);
796 
797 #else  /* __ASSEMBLY__ */
798 
799 #define _PVSITE(ptype, ops, word, algn)		\
800 771:;						\
801 	ops;					\
802 772:;						\
803 	.pushsection .parainstructions,"a";	\
804 	 .align	algn;				\
805 	 word 771b;				\
806 	 .byte ptype;				\
807 	 .byte 772b-771b;			\
808 	.popsection
809 
810 
811 #define COND_PUSH(set, mask, reg)			\
812 	.if ((~(set)) & mask); push %reg; .endif
813 #define COND_POP(set, mask, reg)			\
814 	.if ((~(set)) & mask); pop %reg; .endif
815 
816 #ifdef CONFIG_X86_64
817 
818 #define PV_SAVE_REGS(set)			\
819 	COND_PUSH(set, CLBR_RAX, rax);		\
820 	COND_PUSH(set, CLBR_RCX, rcx);		\
821 	COND_PUSH(set, CLBR_RDX, rdx);		\
822 	COND_PUSH(set, CLBR_RSI, rsi);		\
823 	COND_PUSH(set, CLBR_RDI, rdi);		\
824 	COND_PUSH(set, CLBR_R8, r8);		\
825 	COND_PUSH(set, CLBR_R9, r9);		\
826 	COND_PUSH(set, CLBR_R10, r10);		\
827 	COND_PUSH(set, CLBR_R11, r11)
828 #define PV_RESTORE_REGS(set)			\
829 	COND_POP(set, CLBR_R11, r11);		\
830 	COND_POP(set, CLBR_R10, r10);		\
831 	COND_POP(set, CLBR_R9, r9);		\
832 	COND_POP(set, CLBR_R8, r8);		\
833 	COND_POP(set, CLBR_RDI, rdi);		\
834 	COND_POP(set, CLBR_RSI, rsi);		\
835 	COND_POP(set, CLBR_RDX, rdx);		\
836 	COND_POP(set, CLBR_RCX, rcx);		\
837 	COND_POP(set, CLBR_RAX, rax)
838 
839 #define PARA_PATCH(off)		((off) / 8)
840 #define PARA_SITE(ptype, ops)	_PVSITE(ptype, ops, .quad, 8)
841 #define PARA_INDIRECT(addr)	*addr(%rip)
842 #else
843 #define PV_SAVE_REGS(set)			\
844 	COND_PUSH(set, CLBR_EAX, eax);		\
845 	COND_PUSH(set, CLBR_EDI, edi);		\
846 	COND_PUSH(set, CLBR_ECX, ecx);		\
847 	COND_PUSH(set, CLBR_EDX, edx)
848 #define PV_RESTORE_REGS(set)			\
849 	COND_POP(set, CLBR_EDX, edx);		\
850 	COND_POP(set, CLBR_ECX, ecx);		\
851 	COND_POP(set, CLBR_EDI, edi);		\
852 	COND_POP(set, CLBR_EAX, eax)
853 
854 #define PARA_PATCH(off)		((off) / 4)
855 #define PARA_SITE(ptype, ops)	_PVSITE(ptype, ops, .long, 4)
856 #define PARA_INDIRECT(addr)	*%cs:addr
857 #endif
858 
859 #ifdef CONFIG_PARAVIRT_XXL
860 #define INTERRUPT_RETURN						\
861 	PARA_SITE(PARA_PATCH(PV_CPU_iret),				\
862 		  ANNOTATE_RETPOLINE_SAFE;				\
863 		  jmp PARA_INDIRECT(pv_ops+PV_CPU_iret);)
864 
865 #define DISABLE_INTERRUPTS(clobbers)					\
866 	PARA_SITE(PARA_PATCH(PV_IRQ_irq_disable),			\
867 		  PV_SAVE_REGS(clobbers | CLBR_CALLEE_SAVE);		\
868 		  ANNOTATE_RETPOLINE_SAFE;				\
869 		  call PARA_INDIRECT(pv_ops+PV_IRQ_irq_disable);	\
870 		  PV_RESTORE_REGS(clobbers | CLBR_CALLEE_SAVE);)
871 
872 #define ENABLE_INTERRUPTS(clobbers)					\
873 	PARA_SITE(PARA_PATCH(PV_IRQ_irq_enable),			\
874 		  PV_SAVE_REGS(clobbers | CLBR_CALLEE_SAVE);		\
875 		  ANNOTATE_RETPOLINE_SAFE;				\
876 		  call PARA_INDIRECT(pv_ops+PV_IRQ_irq_enable);		\
877 		  PV_RESTORE_REGS(clobbers | CLBR_CALLEE_SAVE);)
878 #endif
879 
880 #ifdef CONFIG_X86_64
881 #ifdef CONFIG_PARAVIRT_XXL
882 /*
883  * If swapgs is used while the userspace stack is still current,
884  * there's no way to call a pvop.  The PV replacement *must* be
885  * inlined, or the swapgs instruction must be trapped and emulated.
886  */
887 #define SWAPGS_UNSAFE_STACK						\
888 	PARA_SITE(PARA_PATCH(PV_CPU_swapgs), swapgs)
889 
890 /*
891  * Note: swapgs is very special, and in practise is either going to be
892  * implemented with a single "swapgs" instruction or something very
893  * special.  Either way, we don't need to save any registers for
894  * it.
895  */
896 #define SWAPGS								\
897 	PARA_SITE(PARA_PATCH(PV_CPU_swapgs),				\
898 		  ANNOTATE_RETPOLINE_SAFE;				\
899 		  call PARA_INDIRECT(pv_ops+PV_CPU_swapgs);		\
900 		 )
901 
902 #define USERGS_SYSRET64							\
903 	PARA_SITE(PARA_PATCH(PV_CPU_usergs_sysret64),			\
904 		  ANNOTATE_RETPOLINE_SAFE;				\
905 		  jmp PARA_INDIRECT(pv_ops+PV_CPU_usergs_sysret64);)
906 
907 #ifdef CONFIG_DEBUG_ENTRY
908 #define SAVE_FLAGS(clobbers)                                        \
909 	PARA_SITE(PARA_PATCH(PV_IRQ_save_fl),			    \
910 		  PV_SAVE_REGS(clobbers | CLBR_CALLEE_SAVE);        \
911 		  ANNOTATE_RETPOLINE_SAFE;			    \
912 		  call PARA_INDIRECT(pv_ops+PV_IRQ_save_fl);	    \
913 		  PV_RESTORE_REGS(clobbers | CLBR_CALLEE_SAVE);)
914 #endif
915 #endif /* CONFIG_PARAVIRT_XXL */
916 #endif	/* CONFIG_X86_64 */
917 
918 #ifdef CONFIG_PARAVIRT_XXL
919 
920 #define GET_CR2_INTO_AX							\
921 	PARA_SITE(PARA_PATCH(PV_MMU_read_cr2),				\
922 		  ANNOTATE_RETPOLINE_SAFE;				\
923 		  call PARA_INDIRECT(pv_ops+PV_MMU_read_cr2);		\
924 		 )
925 
926 #endif /* CONFIG_PARAVIRT_XXL */
927 
928 
929 #endif /* __ASSEMBLY__ */
930 #else  /* CONFIG_PARAVIRT */
931 # define default_banner x86_init_noop
932 #endif /* !CONFIG_PARAVIRT */
933 
934 #ifndef __ASSEMBLY__
935 #ifndef CONFIG_PARAVIRT_XXL
paravirt_arch_dup_mmap(struct mm_struct * oldmm,struct mm_struct * mm)936 static inline void paravirt_arch_dup_mmap(struct mm_struct *oldmm,
937 					  struct mm_struct *mm)
938 {
939 }
940 #endif
941 
942 #ifndef CONFIG_PARAVIRT
paravirt_arch_exit_mmap(struct mm_struct * mm)943 static inline void paravirt_arch_exit_mmap(struct mm_struct *mm)
944 {
945 }
946 #endif
947 #endif /* __ASSEMBLY__ */
948 #endif /* _ASM_X86_PARAVIRT_H */
949