# Patch summary (commentary only; everything from "diff --git" onward is the
# original patch text, unchanged).
#
# 1. src/arch/x86/isa/decoder/two_byte_opcodes.isa
#    In the decode block that follows the "repne (0xF2)" comment, entry 0x4
#    of "0x8: decode OPCODE_OP_BOTTOM3" changes from the placeholder
#    WarnUnimpl::haddps_Vo_Wo() to HADDPS(Vo,Wo). Entry 0x5 (hsubps) is left
#    as WarnUnimpl, and the default is still UD2().
#
# 2. src/arch/x86/isa/insts/simd128/floating_point/arithmetic/
#    horizontal_addition.py
#    The "# HADDPS" placeholder inside the microcode string is replaced by
#    three macroops, one per source-operand form:
#      HADDPS_XMM_XMM - source read from xmmlm / xmmhm.
#      HADDPS_XMM_M   - source read by two dataSize=8 ldfp loads through
#                       seg, sib at disp and "DISPLACEMENT+8".
#      HADDPS_XMM_P   - as _M, but issues "rdip t7" first and addresses
#                       through seg, riprel.
#
#    All three share the same shape:
#      * ufp1 and ufp2 are built from the destination halves xmml / xmmh by
#        two size=4 shuffles with ext=((0 << 0) | (2 << 2)) and
#        ext=((1 << 0) | (3 << 2)).
#      * The source halves go through the same pair of shuffle selectors.
#      * "maddf xmml, ufp1, ufp2" writes the low destination half from the
#        destination-derived temporaries; the second maddf writes xmmh from
#        the source-derived temporaries.
#      * Every shuffle is issued before either maddf, so xmml / xmmh are
#        read before they are overwritten.
#    In the _M and _P forms the first source shuffle writes ufp5, and the
#    second shuffle overwrites ufp3 while also using ufp3 as an input; the
#    final maddf then combines ufp3 and ufp5.
#
#    NOTE(review): presumably selectors (0, 2) pick the even-indexed and
#    (1, 3) the odd-indexed 32-bit elements of the two 64-bit inputs, so each
#    maddf adds adjacent single-precision pairs. The shuffle and maddf
#    microop definitions are not visible here - confirm against them.
#
# NOTE(review): as seen here the patch text has lost its original line breaks
# and indentation; presumably these must be restored before it can be
# applied. The HADDPD_XMM_XMM lines at the end are trailing diff context
# only; that definition is not complete in this view.
diff --git a/src/arch/x86/isa/decoder/two_byte_opcodes.isa b/src/arch/x86/isa/decoder/two_byte_opcodes.isa --- a/src/arch/x86/isa/decoder/two_byte_opcodes.isa +++ b/src/arch/x86/isa/decoder/two_byte_opcodes.isa @@ -669,7 +669,7 @@ } // repne (0xF2) 0x8: decode OPCODE_OP_BOTTOM3 { - 0x4: WarnUnimpl::haddps_Vo_Wo(); + 0x4: HADDPS(Vo,Wo); 0x5: WarnUnimpl::hsubps_Vo_Wo(); default: UD2(); } diff --git a/src/arch/x86/isa/insts/simd128/floating_point/arithmetic/horizontal_addition.py b/src/arch/x86/isa/insts/simd128/floating_point/arithmetic/horizontal_addition.py --- a/src/arch/x86/isa/insts/simd128/floating_point/arithmetic/horizontal_addition.py +++ b/src/arch/x86/isa/insts/simd128/floating_point/arithmetic/horizontal_addition.py @@ -36,7 +36,43 @@ # Authors: Gabe Black microcode = ''' -# HADDPS +def macroop HADDPS_XMM_XMM { + shuffle ufp1, xmml, xmmh, ext=((0 << 0) | (2 << 2)), size=4 + shuffle ufp2, xmml, xmmh, ext=((1 << 0) | (3 << 2)), size=4 + shuffle ufp3, xmmlm, xmmhm, ext=((0 << 0) | (2 << 2)), size=4 + shuffle ufp4, xmmlm, xmmhm, ext=((1 << 0) | (3 << 2)), size=4 + + maddf xmml, ufp1, ufp2, size=4 + maddf xmmh, ufp3, ufp4, size=4 +}; + +def macroop HADDPS_XMM_M { + shuffle ufp1, xmml, xmmh, ext=((0 << 0) | (2 << 2)), size=4 + shuffle ufp2, xmml, xmmh, ext=((1 << 0) | (3 << 2)), size=4 + + ldfp ufp3, seg, sib, disp, dataSize=8 + ldfp ufp4, seg, sib, "DISPLACEMENT+8", dataSize=8 + shuffle ufp5, ufp3, ufp4, ext=((0 << 0) | (2 << 2)), size=4 + shuffle ufp3, ufp3, ufp4, ext=((1 << 0) | (3 << 2)), size=4 + + maddf xmml, ufp1, ufp2, size=4 + maddf xmmh, ufp3, ufp5, size=4 +}; + +def macroop HADDPS_XMM_P { + rdip t7 + + shuffle ufp1, xmml, xmmh, ext=((0 << 0) | (2 << 2)), size=4 + shuffle ufp2, xmml, xmmh, ext=((1 << 0) | (3 << 2)), size=4 + + ldfp ufp3, seg, riprel, disp, dataSize=8 + ldfp ufp4, seg, riprel, "DISPLACEMENT+8", dataSize=8 + shuffle ufp5, ufp3, ufp4, ext=((0 << 0) | (2 << 2)), size=4 + shuffle ufp3, ufp3, ufp4, ext=((1 << 0) | (3 << 2)), size=4 + 
maddf xmml, ufp1, ufp2, size=4 + maddf xmmh, ufp3, ufp5, size=4 +}; def macroop HADDPD_XMM_XMM { maddf ufp1, xmmh , xmml, size=8, ext=Scalar