mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2025-01-31 20:51:52 +01:00
AMDGPU: Fix v_dot{4, 8}* instruction encoding
Differential Revision: https://reviews.llvm.org/D46848 llvm-svn: 332387
This commit is contained in:
parent
059282774a
commit
952e2e92b4
@ -153,19 +153,24 @@ class getVOP3VCC<VOPProfile P, SDPatternOperator node> {
|
||||
(i1 VCC)))];
|
||||
}
|
||||
|
||||
class VOP3Features<bit Clamp, bit OpSel> {
|
||||
class VOP3Features<bit Clamp, bit OpSel, bit Packed> {
|
||||
bit HasClamp = Clamp;
|
||||
bit HasOpSel = OpSel;
|
||||
bit IsPacked = Packed;
|
||||
}
|
||||
|
||||
def VOP3_REGULAR : VOP3Features<0, 0>;
|
||||
def VOP3_CLAMP : VOP3Features<1, 0>;
|
||||
def VOP3_OPSEL : VOP3Features<1, 1>;
|
||||
def VOP3_REGULAR : VOP3Features<0, 0, 0>;
|
||||
def VOP3_CLAMP : VOP3Features<1, 0, 0>;
|
||||
def VOP3_OPSEL : VOP3Features<1, 1, 0>;
|
||||
def VOP3_PACKED : VOP3Features<1, 1, 1>;
|
||||
|
||||
class VOP3_Profile<VOPProfile P, VOP3Features Features = VOP3_REGULAR> : VOPProfile<P.ArgVT> {
|
||||
|
||||
let HasClamp = !if(Features.HasClamp, 1, P.HasClamp);
|
||||
let HasOpSel = !if(Features.HasOpSel, 1, P.HasOpSel);
|
||||
let IsPacked = !if(Features.IsPacked, 1, P.IsPacked);
|
||||
|
||||
let HasModifiers = !if(Features.IsPacked, 1, P.HasModifiers);
|
||||
|
||||
// FIXME: Hack to stop printing _e64
|
||||
let Outs64 = (outs DstRC.RegClass:$vdst);
|
||||
|
@ -170,10 +170,10 @@ let SubtargetPredicate = HasDLInsts in {
|
||||
def V_DOT2_F32_F16 : VOP3PInst<"v_dot2_f32_f16", VOP3_Profile<VOP_F32_V2F16_V2F16_F32>, int_amdgcn_fdot2>;
|
||||
def V_DOT2_I32_I16 : VOP3PInst<"v_dot2_i32_i16", VOP3_Profile<VOP_I32_V2I16_V2I16_I32>, int_amdgcn_sdot2>;
|
||||
def V_DOT2_U32_U16 : VOP3PInst<"v_dot2_u32_u16", VOP3_Profile<VOP_I32_V2I16_V2I16_I32>, int_amdgcn_udot2>;
|
||||
def V_DOT4_I32_I8 : VOP3Inst<"v_dot4_i32_i8", VOP3_Profile<VOP_I32_I32_I32_I32>, int_amdgcn_sdot4>;
|
||||
def V_DOT4_U32_U8 : VOP3Inst<"v_dot4_u32_u8", VOP3_Profile<VOP_I32_I32_I32_I32>, int_amdgcn_udot4>;
|
||||
def V_DOT8_I32_I4 : VOP3Inst<"v_dot8_i32_i4", VOP3_Profile<VOP_I32_I32_I32_I32>, int_amdgcn_sdot8>;
|
||||
def V_DOT8_U32_U4 : VOP3Inst<"v_dot8_u32_u4", VOP3_Profile<VOP_I32_I32_I32_I32>, int_amdgcn_udot8>;
|
||||
def V_DOT4_I32_I8 : VOP3PInst<"v_dot4_i32_i8", VOP3_Profile<VOP_I32_I32_I32_I32, VOP3_PACKED>, int_amdgcn_sdot4>;
|
||||
def V_DOT4_U32_U8 : VOP3PInst<"v_dot4_u32_u8", VOP3_Profile<VOP_I32_I32_I32_I32, VOP3_PACKED>, int_amdgcn_udot4>;
|
||||
def V_DOT8_I32_I4 : VOP3PInst<"v_dot8_i32_i4", VOP3_Profile<VOP_I32_I32_I32_I32, VOP3_PACKED>, int_amdgcn_sdot8>;
|
||||
def V_DOT8_U32_U4 : VOP3PInst<"v_dot8_u32_u4", VOP3_Profile<VOP_I32_I32_I32_I32, VOP3_PACKED>, int_amdgcn_udot8>;
|
||||
|
||||
} // End SubtargetPredicate = HasDLInsts
|
||||
|
||||
|
@ -378,13 +378,13 @@ v_dot2_f32_f16 v0, v1, v2, v3
|
||||
v_dot2_i32_i16 v0, v1, v2, v3
|
||||
// CHECK: encoding: [0x00,0x40,0xa7,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot2_u32_u16 v0, v1, v2, v3
|
||||
// CHECK: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x04]
|
||||
// CHECK: encoding: [0x00,0x40,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3
|
||||
// CHECK: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x04]
|
||||
// CHECK: encoding: [0x00,0x40,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3
|
||||
// CHECK: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x04]
|
||||
// CHECK: encoding: [0x00,0x40,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3
|
||||
// CHECK: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x04]
|
||||
// CHECK: encoding: [0x00,0x40,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3
|
||||
|
||||
//
|
||||
@ -535,6 +535,198 @@ v_dot2_u32_u16 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[0,1]
|
||||
v_dot2_u32_u16 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x18,0xa7,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot2_u32_u16 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x40,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,0]
|
||||
// CHECK: encoding: [0x00,0x50,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,1]
|
||||
// CHECK: encoding: [0x00,0x48,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,0]
|
||||
// CHECK: encoding: [0x00,0x58,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x10,0xa8,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x10,0xa8,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x10,0xa8,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x10,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x08,0xa8,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x08,0xa8,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x08,0xa8,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x08,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x18,0xa8,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x18,0xa8,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x18,0xa8,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x18,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x40,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,0]
|
||||
// CHECK: encoding: [0x00,0x50,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,1]
|
||||
// CHECK: encoding: [0x00,0x48,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,0]
|
||||
// CHECK: encoding: [0x00,0x58,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x10,0xa9,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x10,0xa9,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x10,0xa9,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x10,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x08,0xa9,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x08,0xa9,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x08,0xa9,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x08,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x18,0xa9,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x18,0xa9,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x18,0xa9,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x18,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x40,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,0]
|
||||
// CHECK: encoding: [0x00,0x50,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,1]
|
||||
// CHECK: encoding: [0x00,0x48,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,0]
|
||||
// CHECK: encoding: [0x00,0x58,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x10,0xaa,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x10,0xaa,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x10,0xaa,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x10,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x08,0xaa,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x08,0xaa,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x08,0xaa,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x08,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x18,0xaa,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x18,0xaa,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x18,0xaa,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x18,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x40,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,0]
|
||||
// CHECK: encoding: [0x00,0x50,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,1]
|
||||
// CHECK: encoding: [0x00,0x48,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,0]
|
||||
// CHECK: encoding: [0x00,0x58,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,0] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x10,0xab,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x10,0xab,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x10,0xab,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x10,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,1] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x08,0xab,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x08,0xab,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x08,0xab,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x08,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,0] op_sel_hi:[1,1]
|
||||
// CHECK: encoding: [0x00,0x18,0xab,0xd3,0x01,0x05,0x0e,0x04]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[0,0]
|
||||
// CHECK: encoding: [0x00,0x18,0xab,0xd3,0x01,0x05,0x0e,0x14]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[0,1]
|
||||
// CHECK: encoding: [0x00,0x18,0xab,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[1,0]
|
||||
// CHECK: encoding: [0x00,0x18,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,1] op_sel_hi:[1,1]
|
||||
|
||||
//
|
||||
// Test clamp.
|
||||
@ -546,6 +738,14 @@ v_dot2_f32_f16 v0, v1, v2, v3 clamp
|
||||
v_dot2_i32_i16 v0, v1, v2, v3 clamp
|
||||
// CHECK: encoding: [0x00,0xc0,0xa7,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot2_u32_u16 v0, v1, v2, v3 clamp
|
||||
// CHECK: encoding: [0x00,0xc0,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_i32_i8 v0, v1, v2, v3 clamp
|
||||
// CHECK: encoding: [0x00,0xc0,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot4_u32_u8 v0, v1, v2, v3 clamp
|
||||
// CHECK: encoding: [0x00,0xc0,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_i32_i4 v0, v1, v2, v3 clamp
|
||||
// CHECK: encoding: [0x00,0xc0,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
v_dot8_u32_u4 v0, v1, v2, v3 clamp
|
||||
|
||||
//
|
||||
// Test neg_lo/neg_hi.
|
||||
|
@ -546,17 +546,17 @@
|
||||
# CHECK: v_dot2_u32_u16 v0, v1, v2, v3 ; encoding: [0x00,0x40,0xa7,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x40,0xa7,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 ; encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x04
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 ; encoding: [0x00,0x40,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x40,0xa8,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 ; encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x04
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 ; encoding: [0x00,0x40,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x40,0xa9,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 ; encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x04
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 ; encoding: [0x00,0x40,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x40,0xaa,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 ; encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x04
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 ; encoding: [0x00,0x40,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x40,0xab,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot2_f32_f16 v0, v1, v2, v3 ; encoding: [0x00,0x40,0xa3,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x40,0xa3,0xd3,0x01,0x05,0x0e,0x1c
|
||||
@ -774,6 +774,294 @@
|
||||
# CHECK: v_dot2_u32_u16 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[1,1,0] ; encoding: [0x00,0x18,0xa7,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x18,0xa7,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 ; encoding: [0x00,0x40,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x40,0xa8,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,1,0] ; encoding: [0x00,0x50,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x50,0xa8,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,0,0] ; encoding: [0x00,0x48,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x48,0xa8,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,1,0] ; encoding: [0x00,0x58,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x58,0xa8,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel_hi:[0,0,0] ; encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel_hi:[0,1,0] ; encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel_hi:[1,0,0] ; encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel_hi:[1,1,0] ; encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel_hi:[0,0,0] ; encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel_hi:[0,1,0] ; encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel_hi:[1,0,0] ; encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel_hi:[1,1,0] ; encoding: [0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x00,0xa8,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[0,0,0] ; encoding: [0x00,0x10,0xa8,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x10,0xa8,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[0,1,0] ; encoding: [0x00,0x10,0xa8,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x10,0xa8,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[1,0,0] ; encoding: [0x00,0x10,0xa8,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x10,0xa8,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[1,1,0] ; encoding: [0x00,0x10,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x10,0xa8,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[0,0,0] ; encoding: [0x00,0x08,0xa8,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x08,0xa8,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[0,1,0] ; encoding: [0x00,0x08,0xa8,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x08,0xa8,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[1,0,0] ; encoding: [0x00,0x08,0xa8,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x08,0xa8,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[1,1,0] ; encoding: [0x00,0x08,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x08,0xa8,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[0,0,0] ; encoding: [0x00,0x18,0xa8,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x18,0xa8,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[0,1,0] ; encoding: [0x00,0x18,0xa8,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x18,0xa8,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[1,0,0] ; encoding: [0x00,0x18,0xa8,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x18,0xa8,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[1,1,0] ; encoding: [0x00,0x18,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x18,0xa8,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 ; encoding: [0x00,0x40,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x40,0xa9,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,1,0] ; encoding: [0x00,0x50,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x50,0xa9,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,0,0] ; encoding: [0x00,0x48,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x48,0xa9,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,1,0] ; encoding: [0x00,0x58,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x58,0xa9,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel_hi:[0,0,0] ; encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel_hi:[0,1,0] ; encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel_hi:[1,0,0] ; encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel_hi:[1,1,0] ; encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel_hi:[0,0,0] ; encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel_hi:[0,1,0] ; encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel_hi:[1,0,0] ; encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel_hi:[1,1,0] ; encoding: [0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x00,0xa9,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[0,0,0] ; encoding: [0x00,0x10,0xa9,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x10,0xa9,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[0,1,0] ; encoding: [0x00,0x10,0xa9,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x10,0xa9,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[1,0,0] ; encoding: [0x00,0x10,0xa9,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x10,0xa9,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[1,1,0] ; encoding: [0x00,0x10,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x10,0xa9,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[0,0,0] ; encoding: [0x00,0x08,0xa9,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x08,0xa9,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[0,1,0] ; encoding: [0x00,0x08,0xa9,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x08,0xa9,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[1,0,0] ; encoding: [0x00,0x08,0xa9,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x08,0xa9,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[1,1,0] ; encoding: [0x00,0x08,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x08,0xa9,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[0,0,0] ; encoding: [0x00,0x18,0xa9,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x18,0xa9,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[0,1,0] ; encoding: [0x00,0x18,0xa9,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x18,0xa9,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[1,0,0] ; encoding: [0x00,0x18,0xa9,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x18,0xa9,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[1,1,0] ; encoding: [0x00,0x18,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x18,0xa9,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 ; encoding: [0x00,0x40,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x40,0xaa,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,1,0] ; encoding: [0x00,0x50,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x50,0xaa,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,0,0] ; encoding: [0x00,0x48,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x48,0xaa,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,1,0] ; encoding: [0x00,0x58,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x58,0xaa,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel_hi:[0,0,0] ; encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel_hi:[0,1,0] ; encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel_hi:[1,0,0] ; encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel_hi:[1,1,0] ; encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel_hi:[0,0,0] ; encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel_hi:[0,1,0] ; encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel_hi:[1,0,0] ; encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel_hi:[1,1,0] ; encoding: [0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x00,0xaa,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[0,0,0] ; encoding: [0x00,0x10,0xaa,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x10,0xaa,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[0,1,0] ; encoding: [0x00,0x10,0xaa,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x10,0xaa,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[1,0,0] ; encoding: [0x00,0x10,0xaa,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x10,0xaa,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[1,1,0] ; encoding: [0x00,0x10,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x10,0xaa,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[0,0,0] ; encoding: [0x00,0x08,0xaa,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x08,0xaa,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[0,1,0] ; encoding: [0x00,0x08,0xaa,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x08,0xaa,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[1,0,0] ; encoding: [0x00,0x08,0xaa,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x08,0xaa,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[1,1,0] ; encoding: [0x00,0x08,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x08,0xaa,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[0,0,0] ; encoding: [0x00,0x18,0xaa,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x18,0xaa,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[0,1,0] ; encoding: [0x00,0x18,0xaa,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x18,0xaa,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[1,0,0] ; encoding: [0x00,0x18,0xaa,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x18,0xaa,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[1,1,0] ; encoding: [0x00,0x18,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x18,0xaa,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 ; encoding: [0x00,0x40,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x40,0xab,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,1,0] ; encoding: [0x00,0x50,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x50,0xab,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,0,0] ; encoding: [0x00,0x48,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x48,0xab,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,1,0] ; encoding: [0x00,0x58,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x58,0xab,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel_hi:[0,0,0] ; encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel_hi:[0,1,0] ; encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel_hi:[1,0,0] ; encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel_hi:[1,1,0] ; encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel_hi:[0,0,0] ; encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel_hi:[0,1,0] ; encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel_hi:[1,0,0] ; encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel_hi:[1,1,0] ; encoding: [0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x00,0xab,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[0,0,0] ; encoding: [0x00,0x10,0xab,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x10,0xab,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[0,1,0] ; encoding: [0x00,0x10,0xab,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x10,0xab,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[1,0,0] ; encoding: [0x00,0x10,0xab,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x10,0xab,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[0,1,0] op_sel_hi:[1,1,0] ; encoding: [0x00,0x10,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x10,0xab,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[0,0,0] ; encoding: [0x00,0x08,0xab,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x08,0xab,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[0,1,0] ; encoding: [0x00,0x08,0xab,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x08,0xab,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[1,0,0] ; encoding: [0x00,0x08,0xab,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x08,0xab,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,0,0] op_sel_hi:[1,1,0] ; encoding: [0x00,0x08,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x08,0xab,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[0,0,0] ; encoding: [0x00,0x18,0xab,0xd3,0x01,0x05,0x0e,0x04]
|
||||
0x00,0x18,0xab,0xd3,0x01,0x05,0x0e,0x04
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[0,1,0] ; encoding: [0x00,0x18,0xab,0xd3,0x01,0x05,0x0e,0x14]
|
||||
0x00,0x18,0xab,0xd3,0x01,0x05,0x0e,0x14
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[1,0,0] ; encoding: [0x00,0x18,0xab,0xd3,0x01,0x05,0x0e,0x0c]
|
||||
0x00,0x18,0xab,0xd3,0x01,0x05,0x0e,0x0c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 op_sel:[1,1,0] op_sel_hi:[1,1,0] ; encoding: [0x00,0x18,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x18,0xab,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot2_f32_f16 v0, v1, v2, v3 clamp ; encoding: [0x00,0xc0,0xa3,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0xc0,0xa3,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
@ -783,6 +1071,18 @@
|
||||
# CHECK: v_dot2_u32_u16 v0, v1, v2, v3 clamp ; encoding: [0x00,0xc0,0xa7,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0xc0,0xa7,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_i32_i8 v0, v1, v2, v3 clamp ; encoding: [0x00,0xc0,0xa8,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0xc0,0xa8,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot4_u32_u8 v0, v1, v2, v3 clamp ; encoding: [0x00,0xc0,0xa9,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0xc0,0xa9,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_i32_i4 v0, v1, v2, v3 clamp ; encoding: [0x00,0xc0,0xaa,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0xc0,0xaa,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot8_u32_u4 v0, v1, v2, v3 clamp ; encoding: [0x00,0xc0,0xab,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0xc0,0xab,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
# CHECK: v_dot2_f32_f16 v0, v1, v2, v3 ; encoding: [0x00,0x40,0xa3,0xd3,0x01,0x05,0x0e,0x1c]
|
||||
0x00,0x40,0xa3,0xd3,0x01,0x05,0x0e,0x1c
|
||||
|
||||
|
Loading…
x
Reference in New Issue
Block a user