Skip to content

Commit b3356bf

Browse files
Gleb Natapov authored and avikivity committed
KVM: emulator: optimize "rep ins" handling
Optimize "rep ins" by allowing the emulator to write back more than one datum at a time. Introduce a new operand type, OP_MEM_STR, which tells writeback() that dst contains a pointer to an array that should be written back, as opposed to just one data element.

Signed-off-by: Gleb Natapov <[email protected]>
Signed-off-by: Avi Kivity <[email protected]>
1 parent f3bd64c commit b3356bf

File tree

2 files changed

+31
-6
lines changed

2 files changed

+31
-6
lines changed

arch/x86/include/asm/kvm_emulate.h

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -213,8 +213,9 @@ typedef u32 __attribute__((vector_size(16))) sse128_t;
213213

214214
/* Type, address-of, and value of an instruction's operand. */
215215
struct operand {
216-
enum { OP_REG, OP_MEM, OP_IMM, OP_XMM, OP_MM, OP_NONE } type;
216+
enum { OP_REG, OP_MEM, OP_MEM_STR, OP_IMM, OP_XMM, OP_MM, OP_NONE } type;
217217
unsigned int bytes;
218+
unsigned int count;
218219
union {
219220
unsigned long orig_val;
220221
u64 orig_val64;
@@ -234,6 +235,7 @@ struct operand {
234235
char valptr[sizeof(unsigned long) + 2];
235236
sse128_t vec_val;
236237
u64 mm_val;
238+
void *data;
237239
};
238240
};
239241

arch/x86/kvm/emulate.c

Lines changed: 28 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -1301,8 +1301,15 @@ static int pio_in_emulated(struct x86_emulate_ctxt *ctxt,
13011301
rc->end = n * size;
13021302
}
13031303

1304-
memcpy(dest, rc->data + rc->pos, size);
1305-
rc->pos += size;
1304+
if (ctxt->rep_prefix && !(ctxt->eflags & EFLG_DF)) {
1305+
ctxt->dst.data = rc->data + rc->pos;
1306+
ctxt->dst.type = OP_MEM_STR;
1307+
ctxt->dst.count = (rc->end - rc->pos) / size;
1308+
rc->pos = rc->end;
1309+
} else {
1310+
memcpy(dest, rc->data + rc->pos, size);
1311+
rc->pos += size;
1312+
}
13061313
return 1;
13071314
}
13081315

@@ -1546,6 +1553,14 @@ static int writeback(struct x86_emulate_ctxt *ctxt)
15461553
if (rc != X86EMUL_CONTINUE)
15471554
return rc;
15481555
break;
1556+
case OP_MEM_STR:
1557+
rc = segmented_write(ctxt,
1558+
ctxt->dst.addr.mem,
1559+
ctxt->dst.data,
1560+
ctxt->dst.bytes * ctxt->dst.count);
1561+
if (rc != X86EMUL_CONTINUE)
1562+
return rc;
1563+
break;
15491564
case OP_XMM:
15501565
write_sse_reg(ctxt, &ctxt->dst.vec_val, ctxt->dst.addr.xmm);
15511566
break;
@@ -2793,7 +2808,7 @@ int emulator_task_switch(struct x86_emulate_ctxt *ctxt,
27932808
static void string_addr_inc(struct x86_emulate_ctxt *ctxt, int reg,
27942809
struct operand *op)
27952810
{
2796-
int df = (ctxt->eflags & EFLG_DF) ? -1 : 1;
2811+
int df = (ctxt->eflags & EFLG_DF) ? -op->count : op->count;
27972812

27982813
register_address_increment(ctxt, reg_rmw(ctxt, reg), df * op->bytes);
27992814
op->addr.mem.ea = register_address(ctxt, reg_read(ctxt, reg));
@@ -3733,7 +3748,7 @@ static const struct opcode opcode_table[256] = {
37333748
I(DstReg | SrcMem | ModRM | Src2Imm, em_imul_3op),
37343749
I(SrcImmByte | Mov | Stack, em_push),
37353750
I(DstReg | SrcMem | ModRM | Src2ImmByte, em_imul_3op),
3736-
I2bvIP(DstDI | SrcDX | Mov | String, em_in, ins, check_perm_in), /* insb, insw/insd */
3751+
I2bvIP(DstDI | SrcDX | Mov | String | Unaligned, em_in, ins, check_perm_in), /* insb, insw/insd */
37373752
I2bvIP(SrcSI | DstDX | String, em_out, outs, check_perm_out), /* outsb, outsw/outsd */
37383753
/* 0x70 - 0x7F */
37393754
X16(D(SrcImmByte)),
@@ -3991,6 +4006,7 @@ static int decode_operand(struct x86_emulate_ctxt *ctxt, struct operand *op,
39914006
register_address(ctxt, reg_read(ctxt, VCPU_REGS_RDI));
39924007
op->addr.mem.seg = VCPU_SREG_ES;
39934008
op->val = 0;
4009+
op->count = 1;
39944010
break;
39954011
case OpDX:
39964012
op->type = OP_REG;
@@ -4034,6 +4050,7 @@ static int decode_operand(struct x86_emulate_ctxt *ctxt, struct operand *op,
40344050
register_address(ctxt, reg_read(ctxt, VCPU_REGS_RSI));
40354051
op->addr.mem.seg = seg_override(ctxt);
40364052
op->val = 0;
4053+
op->count = 1;
40374054
break;
40384055
case OpImmFAddr:
40394056
op->type = OP_IMM;
@@ -4575,8 +4592,14 @@ int x86_emulate_insn(struct x86_emulate_ctxt *ctxt)
45754592
string_addr_inc(ctxt, VCPU_REGS_RDI, &ctxt->dst);
45764593

45774594
if (ctxt->rep_prefix && (ctxt->d & String)) {
4595+
unsigned int count;
45784596
struct read_cache *r = &ctxt->io_read;
4579-
register_address_increment(ctxt, reg_rmw(ctxt, VCPU_REGS_RCX), -1);
4597+
if ((ctxt->d & SrcMask) == SrcSI)
4598+
count = ctxt->src.count;
4599+
else
4600+
count = ctxt->dst.count;
4601+
register_address_increment(ctxt, reg_rmw(ctxt, VCPU_REGS_RCX),
4602+
-count);
45804603

45814604
if (!string_insn_completed(ctxt)) {
45824605
/*

0 commit comments

Comments
 (0)