KVM: emulate: protect checks on ctxt->d by a common "if (unlikely())"
There are several checks for "peculiar" aspects of instructions in both x86_decode_insn and x86_emulate_insn. Group them together, and guard them with a single "if" that lets the processor quickly skip them all. Make this more effective by adding two more flag bits that say whether the .intercept and .check_perm fields are valid. We will reuse these flags later to avoid initializing fields of the emulate_ctxt struct. This skims about 30 cycles for each emulated instructions, which is approximately a 3% improvement. Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
This commit is contained in:
		
					parent
					
						
							
								e24186e097
							
						
					
				
			
			
				commit
				
					
						d40a6898e5
					
				
			
		
					 1 changed files with 97 additions and 84 deletions
				
			
		|  | @ -162,6 +162,8 @@ | ||||||
| #define NoWrite     ((u64)1 << 45)  /* No writeback */ | #define NoWrite     ((u64)1 << 45)  /* No writeback */ | ||||||
| #define SrcWrite    ((u64)1 << 46)  /* Write back src operand */ | #define SrcWrite    ((u64)1 << 46)  /* Write back src operand */ | ||||||
| #define NoMod	    ((u64)1 << 47)  /* Mod field is ignored */ | #define NoMod	    ((u64)1 << 47)  /* Mod field is ignored */ | ||||||
|  | #define Intercept   ((u64)1 << 48)  /* Has valid intercept field */ | ||||||
|  | #define CheckPerm   ((u64)1 << 49)  /* Has valid check_perm field */ | ||||||
| 
 | 
 | ||||||
| #define DstXacc     (DstAccLo | SrcAccHi | SrcWrite) | #define DstXacc     (DstAccLo | SrcAccHi | SrcWrite) | ||||||
| 
 | 
 | ||||||
|  | @ -3546,9 +3548,9 @@ static int check_perm_out(struct x86_emulate_ctxt *ctxt) | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| #define D(_y) { .flags = (_y) } | #define D(_y) { .flags = (_y) } | ||||||
| #define DI(_y, _i) { .flags = (_y), .intercept = x86_intercept_##_i } | #define DI(_y, _i) { .flags = (_y)|Intercept, .intercept = x86_intercept_##_i } | ||||||
| #define DIP(_y, _i, _p) { .flags = (_y), .intercept = x86_intercept_##_i, \ | #define DIP(_y, _i, _p) { .flags = (_y)|Intercept|CheckPerm, \ | ||||||
| 		      .check_perm = (_p) } | 		      .intercept = x86_intercept_##_i, .check_perm = (_p) } | ||||||
| #define N    D(NotImpl) | #define N    D(NotImpl) | ||||||
| #define EXT(_f, _e) { .flags = ((_f) | RMExt), .u.group = (_e) } | #define EXT(_f, _e) { .flags = ((_f) | RMExt), .u.group = (_e) } | ||||||
| #define G(_f, _g) { .flags = ((_f) | Group | ModRM), .u.group = (_g) } | #define G(_f, _g) { .flags = ((_f) | Group | ModRM), .u.group = (_g) } | ||||||
|  | @ -3557,10 +3559,10 @@ static int check_perm_out(struct x86_emulate_ctxt *ctxt) | ||||||
| #define I(_f, _e) { .flags = (_f), .u.execute = (_e) } | #define I(_f, _e) { .flags = (_f), .u.execute = (_e) } | ||||||
| #define F(_f, _e) { .flags = (_f) | Fastop, .u.fastop = (_e) } | #define F(_f, _e) { .flags = (_f) | Fastop, .u.fastop = (_e) } | ||||||
| #define II(_f, _e, _i) \ | #define II(_f, _e, _i) \ | ||||||
| 	{ .flags = (_f), .u.execute = (_e), .intercept = x86_intercept_##_i } | 	{ .flags = (_f)|Intercept, .u.execute = (_e), .intercept = x86_intercept_##_i } | ||||||
| #define IIP(_f, _e, _i, _p) \ | #define IIP(_f, _e, _i, _p) \ | ||||||
| 	{ .flags = (_f), .u.execute = (_e), .intercept = x86_intercept_##_i, \ | 	{ .flags = (_f)|Intercept|CheckPerm, .u.execute = (_e), \ | ||||||
| 	  .check_perm = (_p) } | 	  .intercept = x86_intercept_##_i, .check_perm = (_p) } | ||||||
| #define GP(_f, _g) { .flags = ((_f) | Prefix), .u.gprefix = (_g) } | #define GP(_f, _g) { .flags = ((_f) | Prefix), .u.gprefix = (_g) } | ||||||
| 
 | 
 | ||||||
| #define D2bv(_f)      D((_f) | ByteOp), D(_f) | #define D2bv(_f)      D((_f) | ByteOp), D(_f) | ||||||
|  | @ -4393,29 +4395,37 @@ done_prefixes: | ||||||
| 		return EMULATION_FAILED; | 		return EMULATION_FAILED; | ||||||
| 
 | 
 | ||||||
| 	ctxt->execute = opcode.u.execute; | 	ctxt->execute = opcode.u.execute; | ||||||
| 	ctxt->check_perm = opcode.check_perm; |  | ||||||
| 	ctxt->intercept = opcode.intercept; |  | ||||||
| 
 | 
 | ||||||
| 	if (ctxt->d & NotImpl) | 	if (unlikely(ctxt->d & | ||||||
| 		return EMULATION_FAILED; | 		     (NotImpl|EmulateOnUD|Stack|Op3264|Sse|Mmx|Intercept|CheckPerm))) { | ||||||
|  | 		/*
 | ||||||
|  | 		 * These are copied unconditionally here, and checked unconditionally | ||||||
|  | 		 * in x86_emulate_insn. | ||||||
|  | 		 */ | ||||||
|  | 		ctxt->check_perm = opcode.check_perm; | ||||||
|  | 		ctxt->intercept = opcode.intercept; | ||||||
| 
 | 
 | ||||||
| 	if (!(ctxt->d & EmulateOnUD) && ctxt->ud) | 		if (ctxt->d & NotImpl) | ||||||
| 		return EMULATION_FAILED; | 			return EMULATION_FAILED; | ||||||
| 
 | 
 | ||||||
| 	if (mode == X86EMUL_MODE_PROT64 && (ctxt->d & Stack)) | 		if (!(ctxt->d & EmulateOnUD) && ctxt->ud) | ||||||
| 		ctxt->op_bytes = 8; | 			return EMULATION_FAILED; | ||||||
| 
 | 
 | ||||||
| 	if (ctxt->d & Op3264) { | 		if (mode == X86EMUL_MODE_PROT64 && (ctxt->d & Stack)) | ||||||
| 		if (mode == X86EMUL_MODE_PROT64) |  | ||||||
| 			ctxt->op_bytes = 8; | 			ctxt->op_bytes = 8; | ||||||
| 		else |  | ||||||
| 			ctxt->op_bytes = 4; |  | ||||||
| 	} |  | ||||||
| 
 | 
 | ||||||
| 	if (ctxt->d & Sse) | 		if (ctxt->d & Op3264) { | ||||||
| 		ctxt->op_bytes = 16; | 			if (mode == X86EMUL_MODE_PROT64) | ||||||
| 	else if (ctxt->d & Mmx) | 				ctxt->op_bytes = 8; | ||||||
| 		ctxt->op_bytes = 8; | 			else | ||||||
|  | 				ctxt->op_bytes = 4; | ||||||
|  | 		} | ||||||
|  | 
 | ||||||
|  | 		if (ctxt->d & Sse) | ||||||
|  | 			ctxt->op_bytes = 16; | ||||||
|  | 		else if (ctxt->d & Mmx) | ||||||
|  | 			ctxt->op_bytes = 8; | ||||||
|  | 	} | ||||||
| 
 | 
 | ||||||
| 	/* ModRM and SIB bytes. */ | 	/* ModRM and SIB bytes. */ | ||||||
| 	if (ctxt->d & ModRM) { | 	if (ctxt->d & ModRM) { | ||||||
|  | @ -4549,76 +4559,79 @@ int x86_emulate_insn(struct x86_emulate_ctxt *ctxt) | ||||||
| 		goto done; | 		goto done; | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	if ((ctxt->mode == X86EMUL_MODE_PROT64 && (ctxt->d & No64)) || | 	if (unlikely(ctxt->d & | ||||||
| 			(ctxt->d & Undefined)) { | 		     (No64|Undefined|Sse|Mmx|Intercept|CheckPerm|Priv|Prot|String))) { | ||||||
| 		rc = emulate_ud(ctxt); | 		if ((ctxt->mode == X86EMUL_MODE_PROT64 && (ctxt->d & No64)) || | ||||||
| 		goto done; | 				(ctxt->d & Undefined)) { | ||||||
| 	} | 			rc = emulate_ud(ctxt); | ||||||
| 
 |  | ||||||
| 	if (((ctxt->d & (Sse|Mmx)) && ((ops->get_cr(ctxt, 0) & X86_CR0_EM))) |  | ||||||
| 	    || ((ctxt->d & Sse) && !(ops->get_cr(ctxt, 4) & X86_CR4_OSFXSR))) { |  | ||||||
| 		rc = emulate_ud(ctxt); |  | ||||||
| 		goto done; |  | ||||||
| 	} |  | ||||||
| 
 |  | ||||||
| 	if ((ctxt->d & (Sse|Mmx)) && (ops->get_cr(ctxt, 0) & X86_CR0_TS)) { |  | ||||||
| 		rc = emulate_nm(ctxt); |  | ||||||
| 		goto done; |  | ||||||
| 	} |  | ||||||
| 
 |  | ||||||
| 	if (ctxt->d & Mmx) { |  | ||||||
| 		rc = flush_pending_x87_faults(ctxt); |  | ||||||
| 		if (rc != X86EMUL_CONTINUE) |  | ||||||
| 			goto done; | 			goto done; | ||||||
| 		/*
 | 		} | ||||||
| 		 * Now that we know the fpu is exception safe, we can fetch |  | ||||||
| 		 * operands from it. |  | ||||||
| 		 */ |  | ||||||
| 		fetch_possible_mmx_operand(ctxt, &ctxt->src); |  | ||||||
| 		fetch_possible_mmx_operand(ctxt, &ctxt->src2); |  | ||||||
| 		if (!(ctxt->d & Mov)) |  | ||||||
| 			fetch_possible_mmx_operand(ctxt, &ctxt->dst); |  | ||||||
| 	} |  | ||||||
| 
 | 
 | ||||||
| 	if (unlikely(ctxt->guest_mode) && ctxt->intercept) { | 		if (((ctxt->d & (Sse|Mmx)) && ((ops->get_cr(ctxt, 0) & X86_CR0_EM))) | ||||||
| 		rc = emulator_check_intercept(ctxt, ctxt->intercept, | 		    || ((ctxt->d & Sse) && !(ops->get_cr(ctxt, 4) & X86_CR4_OSFXSR))) { | ||||||
| 					      X86_ICPT_PRE_EXCEPT); | 			rc = emulate_ud(ctxt); | ||||||
| 		if (rc != X86EMUL_CONTINUE) |  | ||||||
| 			goto done; | 			goto done; | ||||||
| 	} | 		} | ||||||
| 
 | 
 | ||||||
| 	/* Privileged instruction can be executed only in CPL=0 */ | 		if ((ctxt->d & (Sse|Mmx)) && (ops->get_cr(ctxt, 0) & X86_CR0_TS)) { | ||||||
| 	if ((ctxt->d & Priv) && ops->cpl(ctxt)) { | 			rc = emulate_nm(ctxt); | ||||||
| 		rc = emulate_gp(ctxt, 0); |  | ||||||
| 		goto done; |  | ||||||
| 	} |  | ||||||
| 
 |  | ||||||
| 	/* Instruction can only be executed in protected mode */ |  | ||||||
| 	if ((ctxt->d & Prot) && ctxt->mode < X86EMUL_MODE_PROT16) { |  | ||||||
| 		rc = emulate_ud(ctxt); |  | ||||||
| 		goto done; |  | ||||||
| 	} |  | ||||||
| 
 |  | ||||||
| 	/* Do instruction specific permission checks */ |  | ||||||
| 	if (ctxt->check_perm) { |  | ||||||
| 		rc = ctxt->check_perm(ctxt); |  | ||||||
| 		if (rc != X86EMUL_CONTINUE) |  | ||||||
| 			goto done; | 			goto done; | ||||||
| 	} | 		} | ||||||
| 
 | 
 | ||||||
| 	if (unlikely(ctxt->guest_mode) && ctxt->intercept) { | 		if (ctxt->d & Mmx) { | ||||||
| 		rc = emulator_check_intercept(ctxt, ctxt->intercept, | 			rc = flush_pending_x87_faults(ctxt); | ||||||
| 					      X86_ICPT_POST_EXCEPT); | 			if (rc != X86EMUL_CONTINUE) | ||||||
| 		if (rc != X86EMUL_CONTINUE) | 				goto done; | ||||||
| 			goto done; | 			/*
 | ||||||
| 	} | 			 * Now that we know the fpu is exception safe, we can fetch | ||||||
|  | 			 * operands from it. | ||||||
|  | 			 */ | ||||||
|  | 			fetch_possible_mmx_operand(ctxt, &ctxt->src); | ||||||
|  | 			fetch_possible_mmx_operand(ctxt, &ctxt->src2); | ||||||
|  | 			if (!(ctxt->d & Mov)) | ||||||
|  | 				fetch_possible_mmx_operand(ctxt, &ctxt->dst); | ||||||
|  | 		} | ||||||
| 
 | 
 | ||||||
| 	if (ctxt->rep_prefix && (ctxt->d & String)) { | 		if (unlikely(ctxt->guest_mode) && ctxt->intercept) { | ||||||
| 		/* All REP prefixes have the same first termination condition */ | 			rc = emulator_check_intercept(ctxt, ctxt->intercept, | ||||||
| 		if (address_mask(ctxt, reg_read(ctxt, VCPU_REGS_RCX)) == 0) { | 						      X86_ICPT_PRE_EXCEPT); | ||||||
| 			ctxt->eip = ctxt->_eip; | 			if (rc != X86EMUL_CONTINUE) | ||||||
|  | 				goto done; | ||||||
|  | 		} | ||||||
|  | 
 | ||||||
|  | 		/* Privileged instruction can be executed only in CPL=0 */ | ||||||
|  | 		if ((ctxt->d & Priv) && ops->cpl(ctxt)) { | ||||||
|  | 			rc = emulate_gp(ctxt, 0); | ||||||
| 			goto done; | 			goto done; | ||||||
| 		} | 		} | ||||||
|  | 
 | ||||||
|  | 		/* Instruction can only be executed in protected mode */ | ||||||
|  | 		if ((ctxt->d & Prot) && ctxt->mode < X86EMUL_MODE_PROT16) { | ||||||
|  | 			rc = emulate_ud(ctxt); | ||||||
|  | 			goto done; | ||||||
|  | 		} | ||||||
|  | 
 | ||||||
|  | 		/* Do instruction specific permission checks */ | ||||||
|  | 		if (ctxt->check_perm) { | ||||||
|  | 			rc = ctxt->check_perm(ctxt); | ||||||
|  | 			if (rc != X86EMUL_CONTINUE) | ||||||
|  | 				goto done; | ||||||
|  | 		} | ||||||
|  | 
 | ||||||
|  | 		if (unlikely(ctxt->guest_mode) && ctxt->intercept) { | ||||||
|  | 			rc = emulator_check_intercept(ctxt, ctxt->intercept, | ||||||
|  | 						      X86_ICPT_POST_EXCEPT); | ||||||
|  | 			if (rc != X86EMUL_CONTINUE) | ||||||
|  | 				goto done; | ||||||
|  | 		} | ||||||
|  | 
 | ||||||
|  | 		if (ctxt->rep_prefix && (ctxt->d & String)) { | ||||||
|  | 			/* All REP prefixes have the same first termination condition */ | ||||||
|  | 			if (address_mask(ctxt, reg_read(ctxt, VCPU_REGS_RCX)) == 0) { | ||||||
|  | 				ctxt->eip = ctxt->_eip; | ||||||
|  | 				goto done; | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	if ((ctxt->src.type == OP_MEM) && !(ctxt->d & NoAccess)) { | 	if ((ctxt->src.type == OP_MEM) && !(ctxt->d & NoAccess)) { | ||||||
|  |  | ||||||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue
	
	 Paolo Bonzini
				Paolo Bonzini