1;; Copyright (C) 2011-2020 Free Software Foundation, Inc. 2;; 3;; This file is part of GCC. 4;; 5;; GCC is free software; you can redistribute it and/or modify it 6;; under the terms of the GNU General Public License as published 7;; by the Free Software Foundation; either version 3, or (at your 8;; option) any later version. 9;; 10;; GCC is distributed in the hope that it will be useful, but WITHOUT 11;; ANY WARRANTY; without even the implied warranty of MERCHANTABILITY 12;; or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public 13;; License for more details. 14;; 15;; You should have received a copy of the GNU General Public License 16;; along with GCC; see the file COPYING3. If not see 17;; <http://www.gnu.org/licenses/>. 18;; 19;; This file contains ARM instructions that support fixed-point operations. 20 21(define_insn "add<mode>3" 22 [(set (match_operand:FIXED 0 "s_register_operand" "=l,r") 23 (plus:FIXED (match_operand:FIXED 1 "s_register_operand" "l,r") 24 (match_operand:FIXED 2 "s_register_operand" "l,r")))] 25 "TARGET_32BIT" 26 "add%?\\t%0, %1, %2" 27 [(set_attr "predicable" "yes") 28 (set_attr "predicable_short_it" "yes,no") 29 (set_attr "type" "alu_sreg")]) 30 31(define_expand "add<mode>3" 32 [(set (match_operand:ADDSUB 0 "s_register_operand") 33 (plus:ADDSUB (match_operand:ADDSUB 1 "s_register_operand") 34 (match_operand:ADDSUB 2 "s_register_operand")))] 35 "TARGET_INT_SIMD" 36 { 37 if (ARM_GE_BITS_READ) 38 FAIL; 39 } 40) 41 42(define_insn "*arm_add<mode>3" 43 [(set (match_operand:ADDSUB 0 "s_register_operand" "=r") 44 (plus:ADDSUB (match_operand:ADDSUB 1 "s_register_operand" "r") 45 (match_operand:ADDSUB 2 "s_register_operand" "r")))] 46 "TARGET_INT_SIMD && !ARM_GE_BITS_READ" 47 "sadd<qaddsub_suf>%?\\t%0, %1, %2" 48 [(set_attr "predicable" "yes") 49 (set_attr "type" "alu_dsp_reg")]) 50 51(define_insn "usadd<mode>3" 52 [(set (match_operand:UQADDSUB 0 "s_register_operand" "=r") 53 (us_plus:UQADDSUB (match_operand:UQADDSUB 1 "s_register_operand" "r") 54 (match_operand:UQADDSUB 2 "s_register_operand" "r")))] 55 "TARGET_INT_SIMD" 56 "uqadd<qaddsub_suf>%?\\t%0, %1, %2" 57 [(set_attr "predicable" "yes") 58 (set_attr "type" "alu_dsp_reg")]) 59 60(define_expand "ssadd<mode>3" 61 [(set (match_operand:QADDSUB 0 "s_register_operand") 62 (ss_plus:QADDSUB (match_operand:QADDSUB 1 "s_register_operand") 63 (match_operand:QADDSUB 2 "s_register_operand")))] 64 "TARGET_INT_SIMD" 65 { 66 if (<qaddsub_clob_q>) 67 FAIL; 68 } 69) 70 71(define_insn "*arm_ssadd<mode>3" 72 [(set (match_operand:QADDSUB 0 "s_register_operand" "=r") 73 (ss_plus:QADDSUB (match_operand:QADDSUB 1 "s_register_operand" "r") 74 (match_operand:QADDSUB 2 "s_register_operand" "r")))] 75 "TARGET_INT_SIMD && !<qaddsub_clob_q>" 76 "qadd<qaddsub_suf>%?\\t%0, %1, %2" 77 [(set_attr "predicable" "yes") 78 (set_attr "type" "alu_dsp_reg")]) 79 80(define_insn "sub<mode>3" 81 [(set (match_operand:FIXED 0 "s_register_operand" "=l,r") 82 (minus:FIXED (match_operand:FIXED 1 "s_register_operand" "l,r") 83 (match_operand:FIXED 2 "s_register_operand" "l,r")))] 84 "TARGET_32BIT" 85 "sub%?\\t%0, %1, %2" 86 [(set_attr "predicable" "yes") 87 (set_attr "predicable_short_it" "yes,no") 88 (set_attr "type" "alu_sreg")]) 89 90(define_expand "sub<mode>3" 91 [(set (match_operand:ADDSUB 0 "s_register_operand") 92 (minus:ADDSUB (match_operand:ADDSUB 1 "s_register_operand") 93 (match_operand:ADDSUB 2 "s_register_operand")))] 94 "TARGET_INT_SIMD" 95 { 96 if (ARM_GE_BITS_READ) 97 FAIL; 98 } 99) 100 101(define_insn "*arm_sub<mode>3" 102 [(set (match_operand:ADDSUB 0 "s_register_operand" "=r") 103 (minus:ADDSUB (match_operand:ADDSUB 1 "s_register_operand" "r") 104 (match_operand:ADDSUB 2 "s_register_operand" "r")))] 105 "TARGET_INT_SIMD && !ARM_GE_BITS_READ" 106 "ssub<qaddsub_suf>%?\\t%0, %1, %2" 107 [(set_attr "predicable" "yes") 108 (set_attr "type" "alu_dsp_reg")]) 109 110(define_insn "ussub<mode>3" 111 [(set (match_operand:UQADDSUB 0 "s_register_operand" "=r") 112 (us_minus:UQADDSUB 113 (match_operand:UQADDSUB 1 "s_register_operand" "r") 114 (match_operand:UQADDSUB 2 "s_register_operand" "r")))] 115 "TARGET_INT_SIMD" 116 "uqsub<qaddsub_suf>%?\\t%0, %1, %2" 117 [(set_attr "predicable" "yes") 118 (set_attr "type" "alu_dsp_reg")]) 119 120(define_expand "sssub<mode>3" 121 [(set (match_operand:QADDSUB 0 "s_register_operand") 122 (ss_minus:QADDSUB (match_operand:QADDSUB 1 "s_register_operand") 123 (match_operand:QADDSUB 2 "s_register_operand")))] 124 "TARGET_INT_SIMD" 125 { 126 if (<qaddsub_clob_q>) 127 FAIL; 128 } 129) 130 131(define_insn "*arm_sssub<mode>3" 132 [(set (match_operand:QADDSUB 0 "s_register_operand" "=r") 133 (ss_minus:QADDSUB (match_operand:QADDSUB 1 "s_register_operand" "r") 134 (match_operand:QADDSUB 2 "s_register_operand" "r")))] 135 "TARGET_INT_SIMD && !<qaddsub_clob_q>" 136 "qsub<qaddsub_suf>%?\\t%0, %1, %2" 137 [(set_attr "predicable" "yes") 138 (set_attr "type" "alu_dsp_reg")]) 139 140;; Fractional multiplies. 141 142; Note: none of these do any rounding. 143 144(define_expand "mulqq3" 145 [(set (match_operand:QQ 0 "s_register_operand") 146 (mult:QQ (match_operand:QQ 1 "s_register_operand") 147 (match_operand:QQ 2 "s_register_operand")))] 148 "TARGET_DSP_MULTIPLY && arm_arch_thumb2" 149{ 150 rtx tmp1 = gen_reg_rtx (HImode); 151 rtx tmp2 = gen_reg_rtx (HImode); 152 rtx tmp3 = gen_reg_rtx (SImode); 153 154 emit_insn (gen_extendqihi2 (tmp1, gen_lowpart (QImode, operands[1]))); 155 emit_insn (gen_extendqihi2 (tmp2, gen_lowpart (QImode, operands[2]))); 156 emit_insn (gen_mulhisi3 (tmp3, tmp1, tmp2)); 157 emit_insn (gen_extv (gen_lowpart (SImode, operands[0]), tmp3, GEN_INT (8), 158 GEN_INT (7))); 159 DONE; 160}) 161 162(define_expand "mulhq3" 163 [(set (match_operand:HQ 0 "s_register_operand") 164 (mult:HQ (match_operand:HQ 1 "s_register_operand") 165 (match_operand:HQ 2 "s_register_operand")))] 166 "TARGET_DSP_MULTIPLY && arm_arch_thumb2" 167{ 168 rtx tmp = gen_reg_rtx (SImode); 169 170 emit_insn (gen_mulhisi3 (tmp, gen_lowpart (HImode, operands[1]), 171 gen_lowpart (HImode, operands[2]))); 172 /* We're doing a s.15 * s.15 multiplication, getting an s.30 result. Extract 173 an s.15 value from that. This won't overflow/saturate for _Fract 174 values. */ 175 emit_insn (gen_extv (gen_lowpart (SImode, operands[0]), tmp, 176 GEN_INT (16), GEN_INT (15))); 177 DONE; 178}) 179 180(define_expand "mulsq3" 181 [(set (match_operand:SQ 0 "s_register_operand") 182 (mult:SQ (match_operand:SQ 1 "s_register_operand") 183 (match_operand:SQ 2 "s_register_operand")))] 184 "TARGET_32BIT" 185{ 186 rtx tmp1 = gen_reg_rtx (DImode); 187 rtx tmp2 = gen_reg_rtx (SImode); 188 rtx tmp3 = gen_reg_rtx (SImode); 189 190 /* s.31 * s.31 -> s.62 multiplication. */ 191 emit_insn (gen_mulsidi3 (tmp1, gen_lowpart (SImode, operands[1]), 192 gen_lowpart (SImode, operands[2]))); 193 emit_insn (gen_lshrsi3 (tmp2, gen_lowpart (SImode, tmp1), GEN_INT (31))); 194 emit_insn (gen_ashlsi3 (tmp3, gen_highpart (SImode, tmp1), GEN_INT (1))); 195 emit_insn (gen_iorsi3 (gen_lowpart (SImode, operands[0]), tmp2, tmp3)); 196 197 DONE; 198}) 199 200;; Accumulator multiplies. 201 202(define_expand "mulsa3" 203 [(set (match_operand:SA 0 "s_register_operand") 204 (mult:SA (match_operand:SA 1 "s_register_operand") 205 (match_operand:SA 2 "s_register_operand")))] 206 "TARGET_32BIT" 207{ 208 rtx tmp1 = gen_reg_rtx (DImode); 209 rtx tmp2 = gen_reg_rtx (SImode); 210 rtx tmp3 = gen_reg_rtx (SImode); 211 212 emit_insn (gen_mulsidi3 (tmp1, gen_lowpart (SImode, operands[1]), 213 gen_lowpart (SImode, operands[2]))); 214 emit_insn (gen_lshrsi3 (tmp2, gen_lowpart (SImode, tmp1), GEN_INT (15))); 215 emit_insn (gen_ashlsi3 (tmp3, gen_highpart (SImode, tmp1), GEN_INT (17))); 216 emit_insn (gen_iorsi3 (gen_lowpart (SImode, operands[0]), tmp2, tmp3)); 217 218 DONE; 219}) 220 221(define_expand "mulusa3" 222 [(set (match_operand:USA 0 "s_register_operand") 223 (mult:USA (match_operand:USA 1 "s_register_operand") 224 (match_operand:USA 2 "s_register_operand")))] 225 "TARGET_32BIT" 226{ 227 rtx tmp1 = gen_reg_rtx (DImode); 228 rtx tmp2 = gen_reg_rtx (SImode); 229 rtx tmp3 = gen_reg_rtx (SImode); 230 231 emit_insn (gen_umulsidi3 (tmp1, gen_lowpart (SImode, operands[1]), 232 gen_lowpart (SImode, operands[2]))); 233 emit_insn (gen_lshrsi3 (tmp2, gen_lowpart (SImode, tmp1), GEN_INT (16))); 234 emit_insn (gen_ashlsi3 (tmp3, gen_highpart (SImode, tmp1), GEN_INT (16))); 235 emit_insn (gen_iorsi3 (gen_lowpart (SImode, operands[0]), tmp2, tmp3)); 236 237 DONE; 238}) 239 240;; The code sequence emitted by this insn pattern uses the Q flag, so we need 241;; to bail out when ARM_Q_BIT_READ and resort to a library sequence instead. 242 243(define_expand "ssmulsa3" 244 [(parallel [(set (match_operand:SA 0 "s_register_operand") 245 (ss_mult:SA (match_operand:SA 1 "s_register_operand") 246 (match_operand:SA 2 "s_register_operand"))) 247 (clobber (match_scratch:DI 3)) 248 (clobber (match_scratch:SI 4)) 249 (clobber (reg:CC CC_REGNUM))])] 250 "TARGET_32BIT && arm_arch6" 251 { 252 if (ARM_Q_BIT_READ) 253 FAIL; 254 } 255) 256 257(define_insn "*arm_ssmulsa3" 258 [(set (match_operand:SA 0 "s_register_operand" "=r") 259 (ss_mult:SA (match_operand:SA 1 "s_register_operand" "r") 260 (match_operand:SA 2 "s_register_operand" "r"))) 261 (clobber (match_scratch:DI 3 "=r")) 262 (clobber (match_scratch:SI 4 "=r")) 263 (clobber (reg:CC CC_REGNUM))] 264 "TARGET_32BIT && arm_arch6 && !ARM_Q_BIT_READ" 265{ 266 /* s16.15 * s16.15 -> s32.30. */ 267 output_asm_insn ("smull\\t%Q3, %R3, %1, %2", operands); 268 269 if (TARGET_ARM) 270 output_asm_insn ("msr\\tAPSR_nzcvq, #0", operands); 271 else 272 { 273 output_asm_insn ("mov\\t%4, #0", operands); 274 output_asm_insn ("msr\\tAPSR_nzcvq, %4", operands); 275 } 276 277 /* We have: 278 31 high word 0 31 low word 0 279 280 [ S i i .... i i i ] [ i f f f ... f f ] 281 | 282 v 283 [ S i ... i f ... f f ] 284 285 Need 16 integral bits, so saturate at 15th bit of high word. */ 286 287 output_asm_insn ("ssat\\t%R3, #15, %R3", operands); 288 output_asm_insn ("mrs\\t%4, APSR", operands); 289 output_asm_insn ("tst\\t%4, #1<<27", operands); 290 if (arm_restrict_it) 291 { 292 output_asm_insn ("mvn\\t%4, %R3, asr #32", operands); 293 output_asm_insn ("it\\tne", operands); 294 output_asm_insn ("movne\\t%Q3, %4", operands); 295 } 296 else 297 { 298 if (TARGET_THUMB2) 299 output_asm_insn ("it\\tne", operands); 300 output_asm_insn ("mvnne\\t%Q3, %R3, asr #32", operands); 301 } 302 output_asm_insn ("mov\\t%0, %Q3, lsr #15", operands); 303 output_asm_insn ("orr\\t%0, %0, %R3, asl #17", operands); 304 return ""; 305} 306 [(set_attr "conds" "clob") 307 (set_attr "type" "multiple") 308 (set (attr "length") 309 (if_then_else (eq_attr "is_thumb" "yes") 310 (if_then_else (match_test "arm_restrict_it") 311 (const_int 40) 312 (const_int 38)) 313 (const_int 32)))]) 314 315(define_expand "usmulusa3" 316 [(parallel [(set (match_operand:USA 0 "s_register_operand") 317 (us_mult:USA (match_operand:USA 1 "s_register_operand") 318 (match_operand:USA 2 "s_register_operand"))) 319 (clobber (match_scratch:DI 3)) 320 (clobber (match_scratch:SI 4)) 321 (clobber (reg:CC CC_REGNUM))])] 322 "TARGET_32BIT && arm_arch6" 323 { 324 if (ARM_Q_BIT_READ) 325 FAIL; 326 } 327) 328 329(define_insn "*arm_usmulusa3" 330 [(set (match_operand:USA 0 "s_register_operand" "=r") 331 (us_mult:USA (match_operand:USA 1 "s_register_operand" "r") 332 (match_operand:USA 2 "s_register_operand" "r"))) 333 (clobber (match_scratch:DI 3 "=r")) 334 (clobber (match_scratch:SI 4 "=r")) 335 (clobber (reg:CC CC_REGNUM))] 336 "TARGET_32BIT && arm_arch6 && !ARM_Q_BIT_READ" 337{ 338 /* 16.16 * 16.16 -> 32.32. */ 339 output_asm_insn ("umull\\t%Q3, %R3, %1, %2", operands); 340 341 if (TARGET_ARM) 342 output_asm_insn ("msr\\tAPSR_nzcvq, #0", operands); 343 else 344 { 345 output_asm_insn ("mov\\t%4, #0", operands); 346 output_asm_insn ("msr\\tAPSR_nzcvq, %4", operands); 347 } 348 349 /* We have: 350 31 high word 0 31 low word 0 351 352 [ i i i .... i i i ] [ f f f f ... f f ] 353 | 354 v 355 [ i i ... i f ... f f ] 356 357 Need 16 integral bits, so saturate at 16th bit of high word. */ 358 359 output_asm_insn ("usat\\t%R3, #16, %R3", operands); 360 output_asm_insn ("mrs\\t%4, APSR", operands); 361 output_asm_insn ("tst\\t%4, #1<<27", operands); 362 if (arm_restrict_it) 363 { 364 output_asm_insn ("sbfx\\t%4, %R3, #15, #1", operands); 365 output_asm_insn ("it\\tne", operands); 366 output_asm_insn ("movne\\t%Q3, %4", operands); 367 } 368 else 369 { 370 if (TARGET_THUMB2) 371 output_asm_insn ("it\\tne", operands); 372 output_asm_insn ("sbfxne\\t%Q3, %R3, #15, #1", operands); 373 } 374 output_asm_insn ("lsr\\t%0, %Q3, #16", operands); 375 output_asm_insn ("orr\\t%0, %0, %R3, asl #16", operands); 376 return ""; 377} 378 [(set_attr "conds" "clob") 379 (set_attr "type" "multiple") 380 (set (attr "length") 381 (if_then_else (eq_attr "is_thumb" "yes") 382 (if_then_else (match_test "arm_restrict_it") 383 (const_int 40) 384 (const_int 38)) 385 (const_int 32)))]) 386 387(define_expand "mulha3" 388 [(set (match_operand:HA 0 "s_register_operand") 389 (mult:HA (match_operand:HA 1 "s_register_operand") 390 (match_operand:HA 2 "s_register_operand")))] 391 "TARGET_DSP_MULTIPLY && arm_arch_thumb2" 392{ 393 rtx tmp = gen_reg_rtx (SImode); 394 395 emit_insn (gen_mulhisi3 (tmp, gen_lowpart (HImode, operands[1]), 396 gen_lowpart (HImode, operands[2]))); 397 emit_insn (gen_extv (gen_lowpart (SImode, operands[0]), tmp, GEN_INT (16), 398 GEN_INT (7))); 399 400 DONE; 401}) 402 403(define_expand "muluha3" 404 [(set (match_operand:UHA 0 "s_register_operand") 405 (mult:UHA (match_operand:UHA 1 "s_register_operand") 406 (match_operand:UHA 2 "s_register_operand")))] 407 "TARGET_DSP_MULTIPLY" 408{ 409 rtx tmp1 = gen_reg_rtx (SImode); 410 rtx tmp2 = gen_reg_rtx (SImode); 411 rtx tmp3 = gen_reg_rtx (SImode); 412 413 /* 8.8 * 8.8 -> 16.16 multiply. */ 414 emit_insn (gen_zero_extendhisi2 (tmp1, gen_lowpart (HImode, operands[1]))); 415 emit_insn (gen_zero_extendhisi2 (tmp2, gen_lowpart (HImode, operands[2]))); 416 emit_insn (gen_mulsi3 (tmp3, tmp1, tmp2)); 417 emit_insn (gen_extzv (gen_lowpart (SImode, operands[0]), tmp3, 418 GEN_INT (16), GEN_INT (8))); 419 420 DONE; 421}) 422 423(define_expand "ssmulha3" 424 [(set (match_operand:HA 0 "s_register_operand") 425 (ss_mult:HA (match_operand:HA 1 "s_register_operand") 426 (match_operand:HA 2 "s_register_operand")))] 427 "TARGET_32BIT && TARGET_DSP_MULTIPLY && arm_arch6" 428{ 429 if (ARM_Q_BIT_READ) 430 FAIL; 431 rtx tmp = gen_reg_rtx (SImode); 432 rtx rshift; 433 434 emit_insn (gen_mulhisi3 (tmp, gen_lowpart (HImode, operands[1]), 435 gen_lowpart (HImode, operands[2]))); 436 437 rshift = gen_rtx_ASHIFTRT (SImode, tmp, GEN_INT (7)); 438 439 emit_insn (gen_rtx_SET (gen_lowpart (HImode, operands[0]), 440 gen_rtx_SS_TRUNCATE (HImode, rshift))); 441 442 DONE; 443}) 444 445(define_expand "usmuluha3" 446 [(set (match_operand:UHA 0 "s_register_operand") 447 (us_mult:UHA (match_operand:UHA 1 "s_register_operand") 448 (match_operand:UHA 2 "s_register_operand")))] 449 "TARGET_INT_SIMD" 450{ 451 if (ARM_Q_BIT_READ) 452 FAIL; 453 454 rtx tmp1 = gen_reg_rtx (SImode); 455 rtx tmp2 = gen_reg_rtx (SImode); 456 rtx tmp3 = gen_reg_rtx (SImode); 457 rtx rshift_tmp = gen_reg_rtx (SImode); 458 459 /* Note: there's no smul[bt][bt] equivalent for unsigned multiplies. Use a 460 normal 32x32->32-bit multiply instead. */ 461 emit_insn (gen_zero_extendhisi2 (tmp1, gen_lowpart (HImode, operands[1]))); 462 emit_insn (gen_zero_extendhisi2 (tmp2, gen_lowpart (HImode, operands[2]))); 463 464 emit_insn (gen_mulsi3 (tmp3, tmp1, tmp2)); 465 466 /* The operand to "usat" is signed, so we cannot use the "..., asr #8" 467 form of that instruction since the multiplication result TMP3 may have the 468 top bit set, thus be negative and saturate to zero. Use a separate 469 logical right-shift instead. */ 470 emit_insn (gen_lshrsi3 (rshift_tmp, tmp3, GEN_INT (8))); 471 emit_insn (gen_arm_usatsihi (gen_lowpart (HImode, operands[0]), rshift_tmp)); 472 473 DONE; 474}) 475 476(define_insn "arm_ssatsihi_shift" 477 [(set (match_operand:HI 0 "s_register_operand" "=r") 478 (ss_truncate:HI (match_operator:SI 1 "sat_shift_operator" 479 [(match_operand:SI 2 "s_register_operand" "r") 480 (match_operand:SI 3 "immediate_operand" "I")])))] 481 "TARGET_32BIT && arm_arch6 && !ARM_Q_BIT_READ" 482 "ssat%?\\t%0, #16, %2%S1" 483 [(set_attr "predicable" "yes") 484 (set_attr "shift" "1") 485 (set_attr "type" "alu_shift_imm")]) 486 487(define_insn "arm_usatsihi" 488 [(set (match_operand:HI 0 "s_register_operand" "=r") 489 (us_truncate:HI (match_operand:SI 1 "s_register_operand")))] 490 "TARGET_INT_SIMD && !ARM_Q_BIT_READ" 491 "usat%?\\t%0, #16, %1" 492 [(set_attr "predicable" "yes") 493 (set_attr "type" "alu_imm")] 494) 495