Lines Matching full:inputs
36 Temp neg_b = fneg(inputs[1]);
37 writeout(0, bld.vop2(aco_opcode::v_mul_f32, bld.def(v1), inputs[0], neg_b));
43 Temp neg_a = fneg(inputs[0]);
49 writeout(2, bld.vop2(aco_opcode::v_mul_f32, bld.def(v1), neg_neg_a, inputs[1]));
54 writeout(3, bld.vop2(aco_opcode::v_mul_f32, bld.def(v1), abs_neg_a, inputs[1]));
58 Temp abs_a = fabs(inputs[0]);
60 writeout(4, bld.vop2(aco_opcode::v_mul_f32, bld.def(v1), neg_abs_a, inputs[1]));
64 … writeout(5, bld.vop2_dpp(aco_opcode::v_mul_f32, bld.def(v1), neg_a, inputs[1], dpp_row_sl(1)));
68 writeout(6, bld.vop2(aco_opcode::v_add_f32, bld.def(v1), neg_a, inputs[1]));
72 writeout(7, bld.vop2(aco_opcode::v_add_f32, bld.def(v1), inputs[1], neg_a));
76 Temp neg_c = fneg(bld.copy(bld.def(v1), inputs[2]));
77 writeout(8, bld.vop2(aco_opcode::v_mul_f32, bld.def(v1), inputs[0], neg_c));
82 writeout(9, bld.vop2(aco_opcode::v_mul_f32, bld.def(v1), abs_neg_abs_a, inputs[1]));
99 Temp tmp = bld.vop2(aco_opcode::v_add_f32, bld.def(v1), inputs[0], inputs[1]);
104 tmp = bld.vop2(aco_opcode::v_add_f32, bld.def(v1), inputs[0], inputs[1]);
109 tmp = bld.vop2(aco_opcode::v_add_f32, bld.def(v1), inputs[0], inputs[1]);
114 tmp = bld.vop2(aco_opcode::v_add_f32, bld.def(v1), inputs[0], inputs[1]);
120 tmp = bld.vop2(aco_opcode::v_add_f32, bld.def(v1), inputs[0], inputs[1]);
129 tmp = bld.vop2(aco_opcode::v_add_f16, bld.def(v2b), inputs[0], inputs[1]);
134 tmp = bld.vop2(aco_opcode::v_add_f16, bld.def(v2b), inputs[0], inputs[1]);
139 tmp = bld.vop2(aco_opcode::v_add_f16, bld.def(v2b), inputs[0], inputs[1]);
144 tmp = bld.vop2(aco_opcode::v_add_f16, bld.def(v2b), inputs[0], inputs[1]);
150 tmp = bld.vop2(aco_opcode::v_add_f16, bld.def(v2b), inputs[0], inputs[1]);
160 tmp = bld.vop2(aco_opcode::v_add_f32, bld.def(v1), inputs[0], inputs[1]);
170 tmp = bld.vop2(aco_opcode::v_xor_b32, bld.def(v1), inputs[0], inputs[1]);
179 tmp = bld.vop2(aco_opcode::v_add_f32, bld.def(v1), inputs[0], inputs[1]);
185 tmp = bld.vop2(aco_opcode::v_add_f32, bld.def(v1), inputs[0], inputs[1]);
200 tmp = bld.vop2(aco_opcode::v_add_f32, bld.def(v1), inputs[0], inputs[1]);
205 tmp = bld.vop2(aco_opcode::v_add_f32, bld.def(v1), inputs[0], inputs[1]);
218 tmp = bld.vop2(aco_opcode::v_add_f16, bld.def(v2b), inputs[0], inputs[1]);
223 tmp = bld.vop2(aco_opcode::v_add_f16, bld.def(v2b), inputs[0], inputs[1]);
240 tmp = bld.vop2(aco_opcode::v_add_f32, bld.def(v1), inputs[0], inputs[1]);
244 tmp = bld.vop2(aco_opcode::v_add_f32, bld.def(v1), inputs[0], inputs[1]);
256 tmp = bld.vop2(aco_opcode::v_add_f16, bld.def(v2b), inputs[0], inputs[1]);
260 tmp = bld.vop2(aco_opcode::v_add_f16, bld.def(v2b), inputs[0], inputs[1]);
282 subbrev = create_subbrev_co(Operand::zero(), Operand::zero(), Operand(inputs[2]));
283 writeout(0, bld.vop2(aco_opcode::v_and_b32, bld.def(v1), inputs[0], subbrev));
287 subbrev = create_subbrev_co(Operand::zero(), Operand::zero(), Operand(inputs[2]));
294 subbrev = create_subbrev_co(Operand::zero(), Operand::zero(), Operand(inputs[2]));
295 writeout(2, bld.vop2(aco_opcode::v_and_b32, bld.def(v1), inputs[1], subbrev));
301 subbrev = create_subbrev_co(Operand::zero(), Operand::zero(), Operand(inputs[2]));
302 Temp xor_a = bld.vop2(aco_opcode::v_xor_b32, bld.def(v1), inputs[0], subbrev);
308 Operand::c32(1u), Operand(inputs[2]));
310 writeout(4, bld.vop2(aco_opcode::v_and_b32, bld.def(v1), Operand(inputs[0]), sub));
328 shift = bld.sop2(aco_opcode::s_lshl_b32, bld.def(s1), bld.def(s1, scc), Operand(inputs[0]),
341 shift = bld.sop2(aco_opcode::s_lshl_b32, bld.def(s1), bld.def(s1, scc), Operand(inputs[0]),
345 Temp vadd = bld.vadd32(bld.def(v1), shift, Operand(inputs[1]));
353 bld.sop2(aco_opcode::s_lshl_b32, bld.def(s1), Operand(inputs[0]), Operand::c32(3u));
354 writeout(2, bld.vadd32(bld.def(v1), lshl, Operand(inputs[1])));
360 Operand a_24bit = Operand(inputs[0]);
363 writeout(3, bld.vadd32(bld.def(v1), lshl, Operand(inputs[1])));
370 Temp carry = bld.vadd32(bld.def(v1), lshl, Operand(inputs[1]), true).def(1).getTemp();
378 writeout(5, bld.vadd32(bld.def(v1), lshl, Operand(inputs[1])));
384 writeout(6, bld.vadd32(bld.def(v1), lshl, Operand(inputs[1])));
389 Operand a_16bit = Operand(inputs[0]);
392 writeout(7, bld.vadd32(bld.def(v1), lshl, Operand(inputs[1])));
408 bcnt = bld.vop3(aco_opcode::v_bcnt_u32_b32, bld.def(v1), Operand(inputs[0]), Operand::zero());
409 writeout(0, bld.vadd32(bld.def(v1), bcnt, Operand(inputs[0])));
413 bcnt = bld.vop3(aco_opcode::v_bcnt_u32_b32, bld.def(v1), Operand(inputs[0]), Operand::zero());
414 writeout(1, bld.vadd32(bld.def(v1), bcnt, Operand(inputs[1])));
418 bcnt = bld.vop3(aco_opcode::v_bcnt_u32_b32, bld.def(v1), Operand(inputs[0]), Operand::zero());
425 bcnt = bld.vop3(aco_opcode::v_bcnt_u32_b32, bld.def(v1), Operand(inputs[1]), Operand::zero());
426 writeout(3, bld.vadd32(bld.def(v1), bcnt, Operand(inputs[0])));
432 bcnt = bld.vop3(aco_opcode::v_bcnt_u32_b32, bld.def(v1), Operand(inputs[0]), Operand::zero());
433 Temp carry = bld.vadd32(bld.def(v1), bcnt, Operand(inputs[0]), true).def(1).getTemp();
492 bld.vop2(cfg.max, bld.def(v1), cfg.lb, inputs[0])));
497 bld.vop2(cfg.min, bld.def(v1), cfg.ub, inputs[0])));
504 bld.vop2(cfg.min, bld.def(v1), cfg.lb, inputs[0])));
510 bld.vop2(cfg.max, bld.def(v1), cfg.ub, inputs[0])));
517 writeout(4, bld.vop2(cfg.min, bld.def(v1), inputs[1],
518 bld.vop2(cfg.max, bld.def(v1), cfg.lb, inputs[0])));
524 bld.vop2(cfg.max, bld.def(v1), inputs[1], inputs[0])));
529 writeout(6, bld.vop2(cfg.min, bld.def(v1), inputs[1],
530 bld.vop2(cfg.max, bld.def(v1), inputs[2], inputs[0])));
536 Builder::Result max = bld.vop2(cfg.max, bld.def(v1), cfg.lb, inputs[0]);
545 min = bld.vop2(cfg.min, bld.def(v1), cfg.ub, inputs[0]);
563 bld.vopc(aco_opcode::v_cmp_neq_f32, bld.def(bld.lm), inputs[0], inputs[0]),
565 Operand::c32(0x40800000u), inputs[0])));
570 bld.vopc(aco_opcode::v_cmp_neq_f32, bld.def(bld.lm), inputs[0], inputs[0]),
572 Operand::c32(0x40800000u), inputs[0])));
577 bld.vopc(aco_opcode::v_cmp_neq_f32, bld.def(bld.lm), inputs[0], inputs[0]),
579 bld.copy(bld.def(v1), Operand::c32(0x40a00000u)), inputs[0])));
585 bld.vopc(aco_opcode::v_cmp_eq_f32, bld.def(bld.lm), inputs[0], inputs[0]),
587 Operand::c32(0x40800000u), inputs[0])));
592 bld.vopc(aco_opcode::v_cmp_eq_f32, bld.def(bld.lm), inputs[0], inputs[0]),
594 Operand::c32(0x40800000u), inputs[0])));
599 bld.vopc(aco_opcode::v_cmp_eq_f32, bld.def(bld.lm), inputs[0], inputs[0]),
601 bld.copy(bld.def(v1), Operand::c32(0x40a00000u)), inputs[0])));
609 bld.vopc(aco_opcode::v_cmp_lt_f32, bld.def(bld.lm), Operand::c32(0x40800000u), inputs[0]);
610 Temp src0 = bld.vopc(aco_opcode::v_cmp_neq_f32, bld.def(bld.lm), inputs[0], inputs[0]);
618 bld.vopc(aco_opcode::v_cmp_nge_f32, bld.def(bld.lm), Operand::c32(0x40800000u), inputs[0]);
619 src0 = bld.vopc(aco_opcode::v_cmp_eq_f32, bld.def(bld.lm), inputs[0], inputs[0]);
626 src1 = bld.vopc(aco_opcode::v_cmp_lt_f32, bld.def(bld.lm), Operand::c32(0x40800000u), inputs[3]);
627 src0 = bld.vopc(aco_opcode::v_cmp_neq_f32, bld.def(bld.lm), inputs[0], inputs[0]);
634 src1 = bld.vopc(aco_opcode::v_cmp_lt_f32, bld.def(bld.lm), Operand::c32(0x40800000u), inputs[0]);
635 src0 = bld.vopc(aco_opcode::v_cmp_neq_f32, bld.def(bld.lm), inputs[0], inputs[3]);
642 bld.pseudo(aco_opcode::p_extract_vector, bld.def(v2b), inputs[1], Operand::zero());
651 bld.vopc(aco_opcode::v_cmp_neq_f64, bld.def(bld.lm), inputs[2], inputs[2]),
653 Operand::c64(0x4010000000000000u), inputs[2])));
664 src1 = bld.vopc(aco_opcode::v_cmp_lt_f16, bld.def(bld.lm), Operand::c16(nan16), inputs[0]);
665 src0 = bld.vopc(aco_opcode::v_cmp_neq_f16, bld.def(bld.lm), inputs[0], inputs[0]);
672 src1 = bld.vopc(aco_opcode::v_cmp_lt_f32, bld.def(bld.lm), Operand::c32(nan32), inputs[0]);
673 src0 = bld.vopc(aco_opcode::v_cmp_neq_f32, bld.def(bld.lm), inputs[0], inputs[0]);
680 src1 = bld.vopc(aco_opcode::v_cmp_lt_f64, bld.def(bld.lm), Operand::c64(nan64), inputs[0]);
681 src0 = bld.vopc(aco_opcode::v_cmp_neq_f64, bld.def(bld.lm), inputs[0], inputs[0]);
694 Builder::Result tmp = bld.vop2(aco_opcode::v_add_u32, bld.def(v1), inputs[1], inputs[2]);
695 writeout(0, bld.vop2(aco_opcode::v_add_u32, bld.def(v1), inputs[0], tmp));
700 tmp = bld.vop2_e64(aco_opcode::v_add_u32, bld.def(v1), inputs[1], inputs[2]);
702 writeout(1, bld.vop2(aco_opcode::v_add_u32, bld.def(v1), inputs[0], tmp));
707 tmp = bld.vop2(aco_opcode::v_add_u32, bld.def(v1), inputs[1], inputs[2]);
708 tmp = bld.vop2_e64(aco_opcode::v_add_u32, bld.def(v1), inputs[0], tmp);
723 Temp xor0 = fneg(inputs[0]);
730 min = bld.vop2(aco_opcode::v_min_f32, bld.def(v1), Operand::zero(), Operand(inputs[0]));
746 Temp mul = bld.vop2(aco_opcode::v_mul_u32_u24, bld.def(v1), inputs[1], inputs[2]);
747 writeout(0, bld.vadd32(bld.def(v1), inputs[0], mul));
752 mul = bld.vop2(aco_opcode::v_mul_u32_u24, bld.def(v1), inputs[1], inputs[2]);
753 writeout(1, bld.vadd32(bld.def(v1), inputs[0], mul, true).def(1).getTemp());
771 lshl = bld.vop2(aco_opcode::v_lshlrev_b32, bld.def(v1), Operand::c32(3u), Operand(inputs[0]));
772 writeout(0, bld.vadd32(bld.def(v1), lshl, Operand(inputs[1])));
778 Operand a_24bit = Operand(inputs[0]);
781 writeout(1, bld.vadd32(bld.def(v1), lshl, Operand(inputs[1])));
787 Operand b_24bit = Operand(inputs[1]);
790 writeout(2, bld.vadd32(bld.def(v1), lshl, Operand(inputs[1])));
796 writeout(3, bld.vadd32(bld.def(v1), lshl, Operand(inputs[1])));
801 Operand a_16bit = Operand(inputs[0]);
804 writeout(4, bld.vadd32(bld.def(v1), lshl, Operand(inputs[1])));
809 Operand c_24bit = Operand(inputs[2]);
812 writeout(5, bld.vadd32(bld.def(v1), lshl, Operand(inputs[2])));
857 return bld.vop2(aco_opcode::v_cndmask_b32, bld.def(v1), Operand::zero(), val, inputs[1]); in emit_denorm_srcdest()
933 Temp val = emit_denorm_srcdest(cfg.src, inputs[0]);
950 0, bld.vop2(aco_opcode::v_cndmask_b32, bld.def(v1), Operand::zero(), val, inputs[1]));
962 Operand a(inputs[0]);
963 Operand b(inputs[1]);
964 Operand c(inputs[2]);
965 Operand d(inputs[3]);
1060 writeout(0, bld.vop2_dpp(aco_opcode::v_mul_f32, bld.def(v1), one, inputs[0], dpp_row_sl(1)));
1064 writeout(1, bld.vop2_dpp(aco_opcode::v_mul_f32, bld.def(v1), inputs[0], one, dpp_row_sl(1)));
1069 … writeout(2, bld.vop2_dpp(aco_opcode::v_mul_f32, bld.def(v1), literal1, inputs[0], dpp_row_sl(1)));
1075 … writeout(3, bld.vop2_dpp(aco_opcode::v_mul_f32, bld.def(v1), inputs[0], literal2, dpp_row_sl(1)));
1080 Temp b_v = bld.copy(bld.def(v1), inputs[1]);
1081 writeout(4, bld.vop2_dpp(aco_opcode::v_mul_f32, bld.def(v1), b_v, inputs[0], dpp_row_sl(1)));
1085 writeout(5, bld.vop2_dpp(aco_opcode::v_mul_f32, bld.def(v1), inputs[0], b_v, dpp_row_sl(1)));
1099 Temp a = inputs[0];
1100 Temp a16 = inputs[1];
1170 Temp a = inputs[0];
1171 Temp a16 = inputs[1];
1205 Temp a = inputs[0];
1206 Temp a16 = inputs[1];
1258 Temp a = inputs[0];
1259 Temp a16 = inputs[1];
1353 Temp a = inputs[0];
1354 Temp b = inputs[1];
1355 Temp c = inputs[2];
1356 Temp a16 = inputs[3];
1357 Temp b16 = inputs[4];
1395 Temp a16 = inputs[0];
1419 Temp a = inputs[0];
1420 Temp b = inputs[1];
1421 Temp a16 = inputs[2];
1422 Temp b16 = inputs[3];
1468 Temp a = inputs[0];
1469 Temp b = inputs[1];
1470 Temp c = inputs[2];
1471 Temp a16 = inputs[3];
1472 Temp c16 = inputs[4];
1522 Temp a = inputs[0];
1523 Temp b = inputs[1];
1524 Temp c = inputs[2];
1525 Temp a16 = inputs[3];
1526 Temp b16 = inputs[4];
1584 Temp a = inputs[0];
1585 Temp a16 = inputs[1];
1611 Temp a = inputs[0];
1612 Temp a16 = inputs[1];
1676 inputs[0], opsel_lo, opsel_hi)); in vop3p_constant()