Lines Matching +full:0 +full:x48
34 do { prog = emit_code(prog, bytes, len); } while (0)
42 do { EMIT1(b1); EMIT(off, 4); } while (0)
44 do { EMIT2(b1, b2); EMIT(off, 4); } while (0)
46 do { EMIT3(b1, b2, b3); EMIT(off, 4); } while (0)
48 do { EMIT4(b1, b2, b3, b4); EMIT(off, 4); } while (0)
69 EMIT3(add_2mod(0x48, DST, SRC), 0x89, add_2reg(0xC0, DST, SRC)); \
70 } while (0)
83 return 0; in bpf_size_to_x86_bytes()
88 * Add 0x10 (and an extra 0x0f) to generate far jumps (. + s32)
90 #define X86_JB 0x72
91 #define X86_JAE 0x73
92 #define X86_JE 0x74
93 #define X86_JNE 0x75
94 #define X86_JBE 0x76
95 #define X86_JA 0x77
96 #define X86_JL 0x7C
97 #define X86_JGE 0x7D
98 #define X86_JLE 0x7E
99 #define X86_JG 0x7F
116 [BPF_REG_0] = 0, /* RAX */
121 [BPF_REG_5] = 0, /* R8 */
210 [BPF_ADD] = 0x01,
211 [BPF_SUB] = 0x29,
212 [BPF_AND] = 0x21,
213 [BPF_OR] = 0x09,
214 [BPF_XOR] = 0x31,
215 [BPF_LSH] = 0xE0,
216 [BPF_RSH] = 0xE8,
217 [BPF_ARSH] = 0xF8,
223 memset(area, 0xcc, size); in jit_fill_hole()
243 if (callee_regs_used[0]) in push_callee_regs()
244 EMIT1(0x53); /* push rbx */ in push_callee_regs()
246 EMIT2(0x41, 0x55); /* push r13 */ in push_callee_regs()
248 EMIT2(0x41, 0x56); /* push r14 */ in push_callee_regs()
250 EMIT2(0x41, 0x57); /* push r15 */ in push_callee_regs()
259 EMIT2(0x41, 0x5F); /* pop r15 */ in pop_callee_regs()
261 EMIT2(0x41, 0x5E); /* pop r14 */ in pop_callee_regs()
263 EMIT2(0x41, 0x5D); /* pop r13 */ in pop_callee_regs()
264 if (callee_regs_used[0]) in pop_callee_regs()
265 EMIT1(0x5B); /* pop rbx */ in pop_callee_regs()
286 EMIT2(0x31, 0xC0); /* xor eax, eax */ in emit_prologue()
288 EMIT2(0x66, 0x90); /* nop2 */ in emit_prologue()
290 EMIT1(0x55); /* push rbp */ in emit_prologue()
291 EMIT3(0x48, 0x89, 0xE5); /* mov rbp, rsp */ in emit_prologue()
294 EMIT3_off32(0x48, 0x81, 0xEC, round_up(stack_depth, 8)); in emit_prologue()
296 EMIT1(0x50); /* push rax */ in emit_prologue()
312 return 0; in emit_patch()
317 return emit_patch(pprog, func, ip, 0xE8); in emit_call()
322 return emit_patch(pprog, func, ip, 0xE9); in emit_jump()
365 ret = 0; in __bpf_arch_text_poke()
385 int bytes = 0; in get_pop_bytes()
393 if (callee_regs_used[0]) in get_pop_bytes()
418 int pop_bytes = 0; in emit_bpf_tail_call_indirect()
448 EMIT2(0x89, 0xD2); /* mov edx, edx */ in emit_bpf_tail_call_indirect()
449 EMIT3(0x39, 0x56, /* cmp dword ptr [rsi + 16], edx */ in emit_bpf_tail_call_indirect()
458 EMIT2_off32(0x8B, 0x85, tcc_off); /* mov eax, dword ptr [rbp - tcc_off] */ in emit_bpf_tail_call_indirect()
459 EMIT3(0x83, 0xF8, MAX_TAIL_CALL_CNT); /* cmp eax, MAX_TAIL_CALL_CNT */ in emit_bpf_tail_call_indirect()
462 EMIT3(0x83, 0xC0, 0x01); /* add eax, 1 */ in emit_bpf_tail_call_indirect()
463 EMIT2_off32(0x89, 0x85, tcc_off); /* mov dword ptr [rbp - tcc_off], eax */ in emit_bpf_tail_call_indirect()
466 EMIT4_off32(0x48, 0x8B, 0x8C, 0xD6, /* mov rcx, [rsi + rdx * 8 + offsetof(...)] */ in emit_bpf_tail_call_indirect()
473 EMIT3(0x48, 0x85, 0xC9); /* test rcx,rcx */ in emit_bpf_tail_call_indirect()
481 EMIT1(0x58); /* pop rax */ in emit_bpf_tail_call_indirect()
483 EMIT3_off32(0x48, 0x81, 0xC4, /* add rsp, sd */ in emit_bpf_tail_call_indirect()
487 EMIT4(0x48, 0x8B, 0x49, /* mov rcx, qword ptr [rcx + 32] */ in emit_bpf_tail_call_indirect()
489 EMIT4(0x48, 0x83, 0xC1, /* add rcx, X86_TAIL_CALL_OFFSET */ in emit_bpf_tail_call_indirect()
508 int pop_bytes = 0; in emit_bpf_tail_call_direct()
523 * - sub rsp, $val if depth > 0 in emit_bpf_tail_call_direct()
536 EMIT2_off32(0x8B, 0x85, tcc_off); /* mov eax, dword ptr [rbp - tcc_off] */ in emit_bpf_tail_call_direct()
537 EMIT3(0x83, 0xF8, MAX_TAIL_CALL_CNT); /* cmp eax, MAX_TAIL_CALL_CNT */ in emit_bpf_tail_call_direct()
539 EMIT3(0x83, 0xC0, 0x01); /* add eax, 1 */ in emit_bpf_tail_call_direct()
540 EMIT2_off32(0x89, 0x85, tcc_off); /* mov dword ptr [rbp - tcc_off], eax */ in emit_bpf_tail_call_direct()
553 EMIT1(0x58); /* pop rax */ in emit_bpf_tail_call_direct()
555 EMIT3_off32(0x48, 0x81, 0xC4, round_up(stack_depth, 8)); in emit_bpf_tail_call_direct()
571 for (i = 0; i < prog->aux->size_poke_tab; i++) { in bpf_tail_call_direct_fixup()
598 BUG_ON(ret < 0); in bpf_tail_call_direct_fixup()
603 BUG_ON(ret < 0); in bpf_tail_call_direct_fixup()
620 if (sign_propagate && (s32)imm32 < 0) { in emit_mov_imm32()
622 b1 = add_1mod(0x48, dst_reg); in emit_mov_imm32()
623 b2 = 0xC7; in emit_mov_imm32()
624 b3 = 0xC0; in emit_mov_imm32()
633 if (imm32 == 0) { in emit_mov_imm32()
635 EMIT1(add_2mod(0x40, dst_reg, dst_reg)); in emit_mov_imm32()
636 b2 = 0x31; /* xor */ in emit_mov_imm32()
637 b3 = 0xC0; in emit_mov_imm32()
644 EMIT1(add_1mod(0x40, dst_reg)); in emit_mov_imm32()
645 EMIT1_off32(add_1reg(0xB8, dst_reg), imm32); in emit_mov_imm32()
665 EMIT2(add_1mod(0x48, dst_reg), add_1reg(0xB8, dst_reg)); in emit_mov_imm64()
683 EMIT1(add_2mod(0x40, dst_reg, src_reg)); in emit_mov_reg()
684 EMIT2(0x89, add_2reg(0xC0, dst_reg, src_reg)); in emit_mov_reg()
698 * If off == 0 we could skip this and save one extra byte, but in emit_insn_suffix()
702 EMIT2(add_2reg(0x40, ptr_reg, val_reg), off); in emit_insn_suffix()
705 EMIT1_off32(add_2reg(0x80, ptr_reg, val_reg), off); in emit_insn_suffix()
718 EMIT1(add_2mod(0x48, dst_reg, src_reg)); in maybe_emit_mod()
720 EMIT1(add_2mod(0x40, dst_reg, src_reg)); in maybe_emit_mod()
732 EMIT3(add_2mod(0x48, src_reg, dst_reg), 0x0F, 0xB6); in emit_ldx()
736 EMIT3(add_2mod(0x48, src_reg, dst_reg), 0x0F, 0xB7); in emit_ldx()
739 /* Emit 'mov eax, dword ptr [rax+0x14]' */ in emit_ldx()
741 EMIT2(add_2mod(0x40, src_reg, dst_reg), 0x8B); in emit_ldx()
743 EMIT1(0x8B); in emit_ldx()
746 /* Emit 'mov rax, qword ptr [rax+0x14]' */ in emit_ldx()
747 EMIT2(add_2mod(0x48, src_reg, dst_reg), 0x8B); in emit_ldx()
764 EMIT2(add_2mod(0x40, dst_reg, src_reg), 0x88); in emit_stx()
766 EMIT1(0x88); in emit_stx()
770 EMIT3(0x66, add_2mod(0x40, dst_reg, src_reg), 0x89); in emit_stx()
772 EMIT2(0x66, 0x89); in emit_stx()
776 EMIT2(add_2mod(0x40, dst_reg, src_reg), 0x89); in emit_stx()
778 EMIT1(0x89); in emit_stx()
781 EMIT2(add_2mod(0x48, dst_reg, src_reg), 0x89); in emit_stx()
793 EMIT1(0xF0); /* lock prefix */ in emit_atomic()
809 EMIT2(0x0F, 0xC1); in emit_atomic()
813 EMIT1(0x87); in emit_atomic()
817 EMIT2(0x0F, 0xB1); in emit_atomic()
827 return 0; in emit_atomic()
837 *(unsigned long *)((void *)regs + reg) = 0; in ex_handler_bpf()
838 regs->ip += x->fixup & 0xff; in ex_handler_bpf()
851 regs_used[0] = true; in detect_reg_usage()
866 while (len > 0) { in emit_nops()
872 for (i = 0; i < noplen; i++) in emit_nops()
892 int i, excnt = 0; in do_jit()
893 int ilen, proglen = 0; in do_jit()
905 bpf_prog->aux->func_idx != 0); in do_jit()
912 addrs[0] = proglen; in do_jit()
919 u8 b2 = 0, b3 = 0; in do_jit()
941 EMIT2(b2, add_2reg(0xC0, dst_reg, src_reg)); in do_jit()
955 EMIT1(add_1mod(0x48, dst_reg)); in do_jit()
957 EMIT1(add_1mod(0x40, dst_reg)); in do_jit()
958 EMIT2(0xF7, add_1reg(0xD8, dst_reg)); in do_jit()
972 EMIT1(add_1mod(0x48, dst_reg)); in do_jit()
974 EMIT1(add_1mod(0x40, dst_reg)); in do_jit()
982 b3 = 0xC0; in do_jit()
983 b2 = 0x05; in do_jit()
986 b3 = 0xE8; in do_jit()
987 b2 = 0x2D; in do_jit()
990 b3 = 0xE0; in do_jit()
991 b2 = 0x25; in do_jit()
994 b3 = 0xC8; in do_jit()
995 b2 = 0x0D; in do_jit()
998 b3 = 0xF0; in do_jit()
999 b2 = 0x35; in do_jit()
1004 EMIT3(0x83, add_1reg(b3, dst_reg), imm32); in do_jit()
1008 EMIT2_off32(0x81, add_1reg(b3, dst_reg), imm32); in do_jit()
1018 emit_mov_imm64(&prog, dst_reg, insn[1].imm, insn[0].imm); in do_jit()
1032 EMIT1(0x50); /* push rax */ in do_jit()
1033 EMIT1(0x52); /* push rdx */ in do_jit()
1040 EMIT3_off32(0x49, 0xC7, 0xC3, imm32); in do_jit()
1049 EMIT2(0x31, 0xd2); in do_jit()
1053 EMIT3(0x49, 0xF7, 0xF3); in do_jit()
1056 EMIT3(0x41, 0xF7, 0xF3); in do_jit()
1060 EMIT3(0x49, 0x89, 0xD3); in do_jit()
1063 EMIT3(0x49, 0x89, 0xC3); in do_jit()
1065 EMIT1(0x5A); /* pop rdx */ in do_jit()
1066 EMIT1(0x58); /* pop rax */ in do_jit()
1080 EMIT1(0x50); /* push rax */ in do_jit()
1082 EMIT1(0x52); /* push rdx */ in do_jit()
1093 EMIT1(add_1mod(0x48, AUX_REG)); in do_jit()
1095 EMIT1(add_1mod(0x40, AUX_REG)); in do_jit()
1097 EMIT2(0xF7, add_1reg(0xE0, AUX_REG)); in do_jit()
1100 EMIT1(0x5A); /* pop rdx */ in do_jit()
1104 EMIT1(0x58); /* pop rax */ in do_jit()
1116 EMIT1(add_1mod(0x48, dst_reg)); in do_jit()
1118 EMIT1(add_1mod(0x40, dst_reg)); in do_jit()
1122 EMIT2(0xD1, add_1reg(b3, dst_reg)); in do_jit()
1124 EMIT3(0xC1, add_1reg(b3, dst_reg), imm32); in do_jit()
1142 EMIT1(0x51); /* push rcx */ in do_jit()
1150 EMIT1(add_1mod(0x48, dst_reg)); in do_jit()
1152 EMIT1(add_1mod(0x40, dst_reg)); in do_jit()
1155 EMIT2(0xD3, add_1reg(b3, dst_reg)); in do_jit()
1158 EMIT1(0x59); /* pop rcx */ in do_jit()
1169 EMIT1(0x66); in do_jit()
1171 EMIT1(0x41); in do_jit()
1172 EMIT3(0xC1, add_1reg(0xC8, dst_reg), 8); in do_jit()
1176 EMIT3(0x45, 0x0F, 0xB7); in do_jit()
1178 EMIT2(0x0F, 0xB7); in do_jit()
1179 EMIT1(add_2reg(0xC0, dst_reg, dst_reg)); in do_jit()
1184 EMIT2(0x41, 0x0F); in do_jit()
1186 EMIT1(0x0F); in do_jit()
1187 EMIT1(add_1reg(0xC8, dst_reg)); in do_jit()
1191 EMIT3(add_1mod(0x48, dst_reg), 0x0F, in do_jit()
1192 add_1reg(0xC8, dst_reg)); in do_jit()
1205 EMIT3(0x45, 0x0F, 0xB7); in do_jit()
1207 EMIT2(0x0F, 0xB7); in do_jit()
1208 EMIT1(add_2reg(0xC0, dst_reg, dst_reg)); in do_jit()
1213 EMIT1(0x45); in do_jit()
1214 EMIT2(0x89, add_2reg(0xC0, dst_reg, dst_reg)); in do_jit()
1226 EMIT3(0x0F, 0xAE, 0xE8); in do_jit()
1232 EMIT2(0x41, 0xC6); in do_jit()
1234 EMIT1(0xC6); in do_jit()
1238 EMIT3(0x66, 0x41, 0xC7); in do_jit()
1240 EMIT2(0x66, 0xC7); in do_jit()
1244 EMIT2(0x41, 0xC7); in do_jit()
1246 EMIT1(0xC7); in do_jit()
1249 EMIT2(add_1mod(0x48, dst_reg), 0xC7); in do_jit()
1252 EMIT2(add_1reg(0x40, dst_reg), insn->off); in do_jit()
1254 EMIT1_off32(add_1reg(0x80, dst_reg), insn->off); in do_jit()
1279 EMIT2(0x85, add_2reg(0xC0, src_reg, src_reg)); in do_jit()
1281 EMIT2(X86_JNE, 0); in do_jit()
1283 emit_mov_imm32(&prog, false, dst_reg, 0); in do_jit()
1285 EMIT2(0xEB, 0); in do_jit()
1332 * End result: x86 insn "mov rbx, qword ptr [rax+0x14]" in do_jit()
1372 add_2reg(0xC0, AUX_REG, real_src_reg)); in do_jit()
1402 EMIT3_off32(0x48, 0x8B, 0x85, in do_jit()
1448 EMIT2(0x39, add_2reg(0xC0, dst_reg, src_reg)); in do_jit()
1456 EMIT2(0x85, add_2reg(0xC0, dst_reg, src_reg)); in do_jit()
1463 EMIT1(add_1mod(0x48, dst_reg)); in do_jit()
1465 EMIT1(add_1mod(0x40, dst_reg)); in do_jit()
1466 EMIT2_off32(0xF7, add_1reg(0xC0, dst_reg), imm32); in do_jit()
1490 if (imm32 == 0) { in do_jit()
1493 EMIT2(0x85, add_2reg(0xC0, dst_reg, dst_reg)); in do_jit()
1499 EMIT1(add_1mod(0x48, dst_reg)); in do_jit()
1501 EMIT1(add_1mod(0x40, dst_reg)); in do_jit()
1504 EMIT3(0x83, add_1reg(0xF8, dst_reg), imm32); in do_jit()
1506 EMIT2_off32(0x81, add_1reg(0xF8, dst_reg), imm32); in do_jit()
1561 * "nops" is 0. in do_jit()
1571 if (nops != 0 && nops != 4) { in do_jit()
1580 EMIT2_off32(0x0F, jmp_cond + 0x10, jmp_offset); in do_jit()
1609 * to pad any extra byte (0 byte). in do_jit()
1617 if (nops != 0 && nops != 2 && nops != 5) { in do_jit()
1634 * jmp, there is nothing to pad (0 byte). in do_jit()
1642 if (nops != 0 && nops != 3) { in do_jit()
1649 EMIT2(0xEB, jmp_offset); in do_jit()
1651 EMIT1_off32(0xE9, jmp_offset); in do_jit()
1667 EMIT1(0xC9); /* leave */ in do_jit()
1668 EMIT1(0xC3); /* ret */ in do_jit()
1722 * mov QWORD PTR [rbp-0x10],rdi in save_regs()
1723 * mov QWORD PTR [rbp-0x8],rsi in save_regs()
1725 for (i = 0; i < min(nr_args, 6); i++) in save_regs()
1739 * EMIT4(0x48, 0x8B, 0x7D, 0xF0); mov rdi,QWORD PTR [rbp-0x10] in restore_regs()
1740 * EMIT4(0x48, 0x8B, 0x75, 0xF8); mov rsi,QWORD PTR [rbp-0x8] in restore_regs()
1742 for (i = 0; i < min(nr_args, 6); i++) in restore_regs()
1764 /* if (__bpf_prog_enter*(prog) == 0) in invoke_bpf_prog()
1767 EMIT3(0x48, 0x85, 0xC0); /* test rax,rax */ in invoke_bpf_prog()
1773 EMIT4(0x48, 0x8D, 0x7D, -stack_size); in invoke_bpf_prog()
1795 jmp_insn[0] = X86_JE; in invoke_bpf_prog()
1808 return 0; in invoke_bpf_prog()
1832 EMIT2_off32(0x0F, jmp_cond + 0x10, offset); in emit_cond_near_jump()
1834 return 0; in emit_cond_near_jump()
1844 for (i = 0; i < tp->nr_progs; i++) { in invoke_bpf()
1850 return 0; in invoke_bpf()
1861 * Set this to 0 to avoid confusing the program. in invoke_bpf_mod_ret()
1863 emit_mov_imm32(&prog, false, BPF_REG_0, 0); in invoke_bpf_mod_ret()
1865 for (i = 0; i < tp->nr_progs; i++) { in invoke_bpf_mod_ret()
1870 * if (*(u64 *)(rbp - 8) != 0) in invoke_bpf_mod_ret()
1873 /* cmp QWORD PTR [rbp - 0x8], 0x0 */ in invoke_bpf_mod_ret()
1874 EMIT4(0x48, 0x83, 0x7d, 0xf8); EMIT1(0x00); in invoke_bpf_mod_ret()
1886 return 0; in invoke_bpf_mod_ret()
2003 EMIT1(0x55); /* push rbp */ in arch_prepare_bpf_trampoline()
2004 EMIT3(0x48, 0x89, 0xE5); /* mov rbp, rsp */ in arch_prepare_bpf_trampoline()
2005 EMIT4(0x48, 0x83, 0xEC, stack_size); /* sub rsp, stack_size */ in arch_prepare_bpf_trampoline()
2006 EMIT1(0x53); /* push rbx */ in arch_prepare_bpf_trampoline()
2015 EMIT4(0x48, 0x83, 0xe8, X86_PATCH_SIZE); in arch_prepare_bpf_trampoline()
2078 for (i = 0; i < fmod_ret->nr_progs; i++) in arch_prepare_bpf_trampoline()
2109 EMIT1(0x5B); /* pop rbx */ in arch_prepare_bpf_trampoline()
2110 EMIT1(0xC9); /* leave */ in arch_prepare_bpf_trampoline()
2113 EMIT4(0x48, 0x83, 0xC4, 8); /* add rsp, 8 */ in arch_prepare_bpf_trampoline()
2114 EMIT1(0xC3); /* ret */ in arch_prepare_bpf_trampoline()
2130 int err = 0; in emit_fallback_jump()
2139 EMIT2(0xFF, 0xE2); /* jmp rdx */ in emit_fallback_jump()
2155 EMIT1(add_1mod(0x48, BPF_REG_3)); /* cmp rdx,func */ in emit_bpf_dispatcher()
2158 EMIT2_off32(0x81, add_1reg(0xF8, BPF_REG_3), in emit_bpf_dispatcher()
2171 return 0; in emit_bpf_dispatcher()
2178 EMIT1(add_1mod(0x48, BPF_REG_3)); /* cmp rdx,func */ in emit_bpf_dispatcher()
2181 EMIT2_off32(0x81, add_1reg(0xF8, BPF_REG_3), progs[a + pivot]); in emit_bpf_dispatcher()
2186 EMIT2_off32(0x0F, X86_JG + 0x10, 0); in emit_bpf_dispatcher()
2188 EMIT2(X86_JG, 0); in emit_bpf_dispatcher()
2212 return 0; in emit_bpf_dispatcher()
2224 return 0; in cmp_ips()
2231 sort(funcs, num_funcs, sizeof(funcs[0]), cmp_ips, NULL); in arch_prepare_bpf_dispatcher()
2232 return emit_bpf_dispatcher(&prog, 0, num_funcs - 1, funcs); in arch_prepare_bpf_dispatcher()
2251 int proglen, oldproglen = 0; in bpf_int_jit_compile()
2305 for (proglen = 0, i = 0; i <= prog->len; i++) { in bpf_int_jit_compile()
2318 for (pass = 0; pass < MAX_PASSES || image; pass++) { in bpf_int_jit_compile()
2322 if (proglen <= 0) { in bpf_int_jit_compile()