28#define DEBUG_TYPE "riscv-vl-optimizer"
29#define PASS_NAME "RISC-V VL Optimizer"
53 std::optional<MachineOperand> getMinimumVLForUser(
MachineOperand &UserOp);
63char RISCVVLOptimizer::ID = 0;
69 return new RISCVVLOptimizer();
75 return RISCV::VRRegClass.contains(R);
85 std::optional<std::pair<unsigned, bool>>
EMUL;
100 return A.Log2EEW ==
B.Log2EEW &&
A.EMUL->first ==
B.EMUL->first &&
101 A.EMUL->second ==
B.EMUL->second;
105 return A.Log2EEW ==
B.Log2EEW;
115 OS <<
"EMUL: unknown\n";
128 const std::optional<OperandInfo> &OI) {
137namespace RISCVVType {
140static std::pair<unsigned, bool>
152 unsigned MISEW = 1 << MILog2SEW;
154 unsigned EEW = 1 << Log2EEW;
157 unsigned Num = EEW, Denom = MISEW;
158 int GCD = MILMULIsFractional ? std::gcd(Num, Denom * MILMUL)
159 : std::gcd(Num * MILMUL, Denom);
160 Num = MILMULIsFractional ? Num / GCD : Num * MILMUL / GCD;
161 Denom = MILMULIsFractional ? Denom * MILMUL / GCD : Denom / GCD;
162 return std::make_pair(Num > Denom ? Num : Denom, Denom > Num);
178 unsigned MISEW = 1 << MILog2SEW;
179 unsigned EEW = MISEW / Factor;
180 unsigned Log2EEW =
Log2_32(EEW);
193 return Desc.operands()[MO.
getOperandNo()].RegClass == RISCV::VMV0RegClassID;
196static std::optional<unsigned>
200 RISCVVPseudosTable::getPseudoInfo(
MI.getOpcode());
201 assert(
RVV &&
"Could not find MI in PseudoTable");
214 if (HasPassthru && MO.
getOperandNo() ==
MI.getNumExplicitDefs() &&
215 (MO.
getReg() != RISCV::NoRegister))
226 switch (
RVV->BaseInstr) {
230 case RISCV::VSETIVLI:
250 case RISCV::VLSE16_V:
251 case RISCV::VSSE16_V:
255 case RISCV::VLSE32_V:
256 case RISCV::VSSE32_V:
260 case RISCV::VLSE64_V:
261 case RISCV::VSSE64_V:
267 case RISCV::VLUXEI8_V:
268 case RISCV::VLOXEI8_V:
269 case RISCV::VSUXEI8_V:
270 case RISCV::VSOXEI8_V: {
275 case RISCV::VLUXEI16_V:
276 case RISCV::VLOXEI16_V:
277 case RISCV::VSUXEI16_V:
278 case RISCV::VSOXEI16_V: {
283 case RISCV::VLUXEI32_V:
284 case RISCV::VLOXEI32_V:
285 case RISCV::VSUXEI32_V:
286 case RISCV::VSOXEI32_V: {
291 case RISCV::VLUXEI64_V:
292 case RISCV::VLOXEI64_V:
293 case RISCV::VSUXEI64_V:
294 case RISCV::VSOXEI64_V: {
307 case RISCV::VRSUB_VI:
308 case RISCV::VRSUB_VX:
332 case RISCV::VMINU_VV:
333 case RISCV::VMINU_VX:
336 case RISCV::VMAXU_VV:
337 case RISCV::VMAXU_VX:
344 case RISCV::VMULH_VV:
345 case RISCV::VMULH_VX:
346 case RISCV::VMULHU_VV:
347 case RISCV::VMULHU_VX:
348 case RISCV::VMULHSU_VV:
349 case RISCV::VMULHSU_VX:
352 case RISCV::VDIVU_VV:
353 case RISCV::VDIVU_VX:
356 case RISCV::VREMU_VV:
357 case RISCV::VREMU_VX:
362 case RISCV::VMACC_VV:
363 case RISCV::VMACC_VX:
364 case RISCV::VNMSAC_VV:
365 case RISCV::VNMSAC_VX:
366 case RISCV::VMADD_VV:
367 case RISCV::VMADD_VX:
368 case RISCV::VNMSUB_VV:
369 case RISCV::VNMSUB_VX:
374 case RISCV::VMERGE_VIM:
375 case RISCV::VMERGE_VVM:
376 case RISCV::VMERGE_VXM:
377 case RISCV::VADC_VIM:
378 case RISCV::VADC_VVM:
379 case RISCV::VADC_VXM:
380 case RISCV::VSBC_VVM:
381 case RISCV::VSBC_VXM:
390 case RISCV::VSADDU_VI:
391 case RISCV::VSADDU_VV:
392 case RISCV::VSADDU_VX:
393 case RISCV::VSADD_VI:
394 case RISCV::VSADD_VV:
395 case RISCV::VSADD_VX:
396 case RISCV::VSSUBU_VV:
397 case RISCV::VSSUBU_VX:
398 case RISCV::VSSUB_VV:
399 case RISCV::VSSUB_VX:
400 case RISCV::VAADDU_VV:
401 case RISCV::VAADDU_VX:
402 case RISCV::VAADD_VV:
403 case RISCV::VAADD_VX:
404 case RISCV::VASUBU_VV:
405 case RISCV::VASUBU_VX:
406 case RISCV::VASUB_VV:
407 case RISCV::VASUB_VX:
411 case RISCV::VSMUL_VV:
412 case RISCV::VSMUL_VX:
415 case RISCV::VSSRL_VI:
416 case RISCV::VSSRL_VV:
417 case RISCV::VSSRL_VX:
418 case RISCV::VSSRA_VI:
419 case RISCV::VSSRA_VV:
420 case RISCV::VSSRA_VX:
427 case RISCV::VFMV_F_S:
428 case RISCV::VFMV_S_F:
431 case RISCV::VSLIDEUP_VI:
432 case RISCV::VSLIDEUP_VX:
433 case RISCV::VSLIDEDOWN_VI:
434 case RISCV::VSLIDEDOWN_VX:
435 case RISCV::VSLIDE1UP_VX:
436 case RISCV::VFSLIDE1UP_VF:
437 case RISCV::VSLIDE1DOWN_VX:
438 case RISCV::VFSLIDE1DOWN_VF:
441 case RISCV::VRGATHER_VI:
442 case RISCV::VRGATHER_VV:
443 case RISCV::VRGATHER_VX:
446 case RISCV::VCOMPRESS_VM:
450 case RISCV::VFADD_VF:
451 case RISCV::VFADD_VV:
452 case RISCV::VFSUB_VF:
453 case RISCV::VFSUB_VV:
454 case RISCV::VFRSUB_VF:
456 case RISCV::VFMUL_VF:
457 case RISCV::VFMUL_VV:
458 case RISCV::VFDIV_VF:
459 case RISCV::VFDIV_VV:
460 case RISCV::VFRDIV_VF:
462 case RISCV::VFSQRT_V:
464 case RISCV::VFRSQRT7_V:
466 case RISCV::VFREC7_V:
468 case RISCV::VFMIN_VF:
469 case RISCV::VFMIN_VV:
470 case RISCV::VFMAX_VF:
471 case RISCV::VFMAX_VV:
473 case RISCV::VFSGNJ_VF:
474 case RISCV::VFSGNJ_VV:
475 case RISCV::VFSGNJN_VV:
476 case RISCV::VFSGNJN_VF:
477 case RISCV::VFSGNJX_VF:
478 case RISCV::VFSGNJX_VV:
480 case RISCV::VFCLASS_V:
482 case RISCV::VFMV_V_F:
484 case RISCV::VFCVT_XU_F_V:
485 case RISCV::VFCVT_X_F_V:
486 case RISCV::VFCVT_RTZ_XU_F_V:
487 case RISCV::VFCVT_RTZ_X_F_V:
488 case RISCV::VFCVT_F_XU_V:
489 case RISCV::VFCVT_F_X_V:
491 case RISCV::VFMERGE_VFM:
495 case RISCV::VFIRST_M:
500 case RISCV::VWADDU_VV:
501 case RISCV::VWADDU_VX:
502 case RISCV::VWSUBU_VV:
503 case RISCV::VWSUBU_VX:
504 case RISCV::VWADD_VV:
505 case RISCV::VWADD_VX:
506 case RISCV::VWSUB_VV:
507 case RISCV::VWSUB_VX:
508 case RISCV::VWSLL_VI:
511 case RISCV::VWMUL_VV:
512 case RISCV::VWMUL_VX:
513 case RISCV::VWMULSU_VV:
514 case RISCV::VWMULSU_VX:
515 case RISCV::VWMULU_VV:
516 case RISCV::VWMULU_VX:
522 case RISCV::VWMACCU_VV:
523 case RISCV::VWMACCU_VX:
524 case RISCV::VWMACC_VV:
525 case RISCV::VWMACC_VX:
526 case RISCV::VWMACCSU_VV:
527 case RISCV::VWMACCSU_VX:
528 case RISCV::VWMACCUS_VX:
530 case RISCV::VFWMACC_VF:
531 case RISCV::VFWMACC_VV:
532 case RISCV::VFWNMACC_VF:
533 case RISCV::VFWNMACC_VV:
534 case RISCV::VFWMSAC_VF:
535 case RISCV::VFWMSAC_VV:
536 case RISCV::VFWNMSAC_VF:
537 case RISCV::VFWNMSAC_VV:
540 case RISCV::VFWADD_VV:
541 case RISCV::VFWADD_VF:
542 case RISCV::VFWSUB_VV:
543 case RISCV::VFWSUB_VF:
545 case RISCV::VFWMUL_VF:
546 case RISCV::VFWMUL_VV:
548 case RISCV::VFWCVT_XU_F_V:
549 case RISCV::VFWCVT_X_F_V:
550 case RISCV::VFWCVT_RTZ_XU_F_V:
551 case RISCV::VFWCVT_RTZ_X_F_V:
552 case RISCV::VFWCVT_F_XU_V:
553 case RISCV::VFWCVT_F_X_V:
554 case RISCV::VFWCVT_F_F_V:
555 case RISCV::VFWCVTBF16_F_F_V:
556 return IsMODef ? MILog2SEW + 1 : MILog2SEW;
559 case RISCV::VWADDU_WV:
560 case RISCV::VWADDU_WX:
561 case RISCV::VWSUBU_WV:
562 case RISCV::VWSUBU_WX:
563 case RISCV::VWADD_WV:
564 case RISCV::VWADD_WX:
565 case RISCV::VWSUB_WV:
566 case RISCV::VWSUB_WX:
568 case RISCV::VFWADD_WF:
569 case RISCV::VFWADD_WV:
570 case RISCV::VFWSUB_WF:
571 case RISCV::VFWSUB_WV: {
572 bool IsOp1 = (HasPassthru && !IsTied) ? MO.
getOperandNo() == 2
574 bool TwoTimes = IsMODef || IsOp1;
575 return TwoTimes ? MILog2SEW + 1 : MILog2SEW;
579 case RISCV::VZEXT_VF2:
580 case RISCV::VSEXT_VF2:
582 case RISCV::VZEXT_VF4:
583 case RISCV::VSEXT_VF4:
585 case RISCV::VZEXT_VF8:
586 case RISCV::VSEXT_VF8:
591 case RISCV::VNSRL_WX:
592 case RISCV::VNSRL_WI:
593 case RISCV::VNSRL_WV:
594 case RISCV::VNSRA_WI:
595 case RISCV::VNSRA_WV:
596 case RISCV::VNSRA_WX:
599 case RISCV::VNCLIPU_WI:
600 case RISCV::VNCLIPU_WV:
601 case RISCV::VNCLIPU_WX:
602 case RISCV::VNCLIP_WI:
603 case RISCV::VNCLIP_WV:
604 case RISCV::VNCLIP_WX:
606 case RISCV::VFNCVT_XU_F_W:
607 case RISCV::VFNCVT_X_F_W:
608 case RISCV::VFNCVT_RTZ_XU_F_W:
609 case RISCV::VFNCVT_RTZ_X_F_W:
610 case RISCV::VFNCVT_F_XU_W:
611 case RISCV::VFNCVT_F_X_W:
612 case RISCV::VFNCVT_F_F_W:
613 case RISCV::VFNCVT_ROD_F_F_W:
614 case RISCV::VFNCVTBF16_F_F_W: {
617 bool TwoTimes = IsOp1;
618 return TwoTimes ? MILog2SEW + 1 : MILog2SEW;
630 case RISCV::VMAND_MM:
631 case RISCV::VMNAND_MM:
632 case RISCV::VMANDN_MM:
633 case RISCV::VMXOR_MM:
635 case RISCV::VMNOR_MM:
636 case RISCV::VMORN_MM:
637 case RISCV::VMXNOR_MM:
640 case RISCV::VMSOF_M: {
647 case RISCV::VIOTA_M: {
655 case RISCV::VMSEQ_VI:
656 case RISCV::VMSEQ_VV:
657 case RISCV::VMSEQ_VX:
658 case RISCV::VMSNE_VI:
659 case RISCV::VMSNE_VV:
660 case RISCV::VMSNE_VX:
661 case RISCV::VMSLTU_VV:
662 case RISCV::VMSLTU_VX:
663 case RISCV::VMSLT_VV:
664 case RISCV::VMSLT_VX:
665 case RISCV::VMSLEU_VV:
666 case RISCV::VMSLEU_VI:
667 case RISCV::VMSLEU_VX:
668 case RISCV::VMSLE_VV:
669 case RISCV::VMSLE_VI:
670 case RISCV::VMSLE_VX:
671 case RISCV::VMSGTU_VI:
672 case RISCV::VMSGTU_VX:
673 case RISCV::VMSGT_VI:
674 case RISCV::VMSGT_VX:
677 case RISCV::VMADC_VIM:
678 case RISCV::VMADC_VVM:
679 case RISCV::VMADC_VXM:
680 case RISCV::VMSBC_VVM:
681 case RISCV::VMSBC_VXM:
683 case RISCV::VMADC_VV:
684 case RISCV::VMADC_VI:
685 case RISCV::VMADC_VX:
686 case RISCV::VMSBC_VV:
687 case RISCV::VMSBC_VX:
690 case RISCV::VMFEQ_VF:
691 case RISCV::VMFEQ_VV:
692 case RISCV::VMFNE_VF:
693 case RISCV::VMFNE_VV:
694 case RISCV::VMFLT_VF:
695 case RISCV::VMFLT_VV:
696 case RISCV::VMFLE_VF:
697 case RISCV::VMFLE_VV:
698 case RISCV::VMFGT_VF:
699 case RISCV::VMFGE_VF: {
707 case RISCV::VREDAND_VS:
708 case RISCV::VREDMAX_VS:
709 case RISCV::VREDMAXU_VS:
710 case RISCV::VREDMIN_VS:
711 case RISCV::VREDMINU_VS:
712 case RISCV::VREDOR_VS:
713 case RISCV::VREDSUM_VS:
714 case RISCV::VREDXOR_VS:
716 case RISCV::VFREDMAX_VS:
717 case RISCV::VFREDMIN_VS:
718 case RISCV::VFREDOSUM_VS:
719 case RISCV::VFREDUSUM_VS: {
726 case RISCV::VWREDSUM_VS:
727 case RISCV::VWREDSUMU_VS:
729 case RISCV::VFWREDOSUM_VS:
730 case RISCV::VFWREDUSUM_VS: {
732 return TwoTimes ? MILog2SEW + 1 : MILog2SEW;
740static std::optional<OperandInfo>
744 RISCVVPseudosTable::getPseudoInfo(
MI.getOpcode());
745 assert(
RVV &&
"Could not find MI in PseudoTable");
751 switch (
RVV->BaseInstr) {
758 case RISCV::VREDAND_VS:
759 case RISCV::VREDMAX_VS:
760 case RISCV::VREDMAXU_VS:
761 case RISCV::VREDMIN_VS:
762 case RISCV::VREDMINU_VS:
763 case RISCV::VREDOR_VS:
764 case RISCV::VREDSUM_VS:
765 case RISCV::VREDXOR_VS:
766 case RISCV::VWREDSUM_VS:
767 case RISCV::VWREDSUMU_VS:
768 case RISCV::VFWREDOSUM_VS:
769 case RISCV::VFWREDUSUM_VS:
785 RISCVVPseudosTable::getPseudoInfo(
MI.getOpcode());
790 switch (
RVV->BaseInstr) {
797 case RISCV::VLSE16_V:
799 case RISCV::VLSE32_V:
801 case RISCV::VLSE64_V:
803 case RISCV::VLUXEI8_V:
804 case RISCV::VLOXEI8_V:
805 case RISCV::VLUXEI16_V:
806 case RISCV::VLOXEI16_V:
807 case RISCV::VLUXEI32_V:
808 case RISCV::VLOXEI32_V:
809 case RISCV::VLUXEI64_V:
810 case RISCV::VLOXEI64_V: {
812 if (MMO->isVolatile())
823 case RISCV::VRSUB_VI:
824 case RISCV::VRSUB_VX:
846 case RISCV::VWADDU_VV:
847 case RISCV::VWADDU_VX:
848 case RISCV::VWSUBU_VV:
849 case RISCV::VWSUBU_VX:
850 case RISCV::VWADD_VV:
851 case RISCV::VWADD_VX:
852 case RISCV::VWSUB_VV:
853 case RISCV::VWSUB_VX:
854 case RISCV::VWADDU_WV:
855 case RISCV::VWADDU_WX:
856 case RISCV::VWSUBU_WV:
857 case RISCV::VWSUBU_WX:
858 case RISCV::VWADD_WV:
859 case RISCV::VWADD_WX:
860 case RISCV::VWSUB_WV:
861 case RISCV::VWSUB_WX:
863 case RISCV::VZEXT_VF2:
864 case RISCV::VSEXT_VF2:
865 case RISCV::VZEXT_VF4:
866 case RISCV::VSEXT_VF4:
867 case RISCV::VZEXT_VF8:
868 case RISCV::VSEXT_VF8:
871 case RISCV::VMADC_VV:
872 case RISCV::VMADC_VI:
873 case RISCV::VMADC_VX:
874 case RISCV::VMSBC_VV:
875 case RISCV::VMSBC_VX:
877 case RISCV::VNSRL_WX:
878 case RISCV::VNSRL_WI:
879 case RISCV::VNSRL_WV:
880 case RISCV::VNSRA_WI:
881 case RISCV::VNSRA_WV:
882 case RISCV::VNSRA_WX:
884 case RISCV::VMSEQ_VI:
885 case RISCV::VMSEQ_VV:
886 case RISCV::VMSEQ_VX:
887 case RISCV::VMSNE_VI:
888 case RISCV::VMSNE_VV:
889 case RISCV::VMSNE_VX:
890 case RISCV::VMSLTU_VV:
891 case RISCV::VMSLTU_VX:
892 case RISCV::VMSLT_VV:
893 case RISCV::VMSLT_VX:
894 case RISCV::VMSLEU_VV:
895 case RISCV::VMSLEU_VI:
896 case RISCV::VMSLEU_VX:
897 case RISCV::VMSLE_VV:
898 case RISCV::VMSLE_VI:
899 case RISCV::VMSLE_VX:
900 case RISCV::VMSGTU_VI:
901 case RISCV::VMSGTU_VX:
902 case RISCV::VMSGT_VI:
903 case RISCV::VMSGT_VX:
905 case RISCV::VMINU_VV:
906 case RISCV::VMINU_VX:
909 case RISCV::VMAXU_VV:
910 case RISCV::VMAXU_VX:
916 case RISCV::VMULH_VV:
917 case RISCV::VMULH_VX:
918 case RISCV::VMULHU_VV:
919 case RISCV::VMULHU_VX:
920 case RISCV::VMULHSU_VV:
921 case RISCV::VMULHSU_VX:
923 case RISCV::VDIVU_VV:
924 case RISCV::VDIVU_VX:
927 case RISCV::VREMU_VV:
928 case RISCV::VREMU_VX:
932 case RISCV::VWMUL_VV:
933 case RISCV::VWMUL_VX:
934 case RISCV::VWMULSU_VV:
935 case RISCV::VWMULSU_VX:
936 case RISCV::VWMULU_VV:
937 case RISCV::VWMULU_VX:
939 case RISCV::VMACC_VV:
940 case RISCV::VMACC_VX:
941 case RISCV::VNMSAC_VV:
942 case RISCV::VNMSAC_VX:
943 case RISCV::VMADD_VV:
944 case RISCV::VMADD_VX:
945 case RISCV::VNMSUB_VV:
946 case RISCV::VNMSUB_VX:
948 case RISCV::VMERGE_VIM:
949 case RISCV::VMERGE_VVM:
950 case RISCV::VMERGE_VXM:
952 case RISCV::VADC_VIM:
953 case RISCV::VADC_VVM:
954 case RISCV::VADC_VXM:
956 case RISCV::VWMACCU_VV:
957 case RISCV::VWMACCU_VX:
958 case RISCV::VWMACC_VV:
959 case RISCV::VWMACC_VX:
960 case RISCV::VWMACCSU_VV:
961 case RISCV::VWMACCSU_VX:
962 case RISCV::VWMACCUS_VX:
971 case RISCV::VAADDU_VV:
972 case RISCV::VAADDU_VX:
973 case RISCV::VAADD_VV:
974 case RISCV::VAADD_VX:
975 case RISCV::VASUBU_VV:
976 case RISCV::VASUBU_VX:
977 case RISCV::VASUB_VV:
978 case RISCV::VASUB_VX:
981 case RISCV::VWSLL_VI:
990 case RISCV::VMAND_MM:
991 case RISCV::VMNAND_MM:
992 case RISCV::VMANDN_MM:
993 case RISCV::VMXOR_MM:
995 case RISCV::VMNOR_MM:
996 case RISCV::VMORN_MM:
997 case RISCV::VMXNOR_MM:
1000 case RISCV::VMSOF_M:
1001 case RISCV::VIOTA_M:
1004 case RISCV::VFADD_VF:
1005 case RISCV::VFADD_VV:
1006 case RISCV::VFSUB_VF:
1007 case RISCV::VFSUB_VV:
1008 case RISCV::VFRSUB_VF:
1010 case RISCV::VFWADD_VV:
1011 case RISCV::VFWADD_VF:
1012 case RISCV::VFWSUB_VV:
1013 case RISCV::VFWSUB_VF:
1014 case RISCV::VFWADD_WF:
1015 case RISCV::VFWADD_WV:
1016 case RISCV::VFWSUB_WF:
1017 case RISCV::VFWSUB_WV:
1019 case RISCV::VFMUL_VF:
1020 case RISCV::VFMUL_VV:
1021 case RISCV::VFDIV_VF:
1022 case RISCV::VFDIV_VV:
1023 case RISCV::VFRDIV_VF:
1025 case RISCV::VFWMUL_VF:
1026 case RISCV::VFWMUL_VV:
1028 case RISCV::VMFEQ_VF:
1029 case RISCV::VMFEQ_VV:
1030 case RISCV::VMFNE_VF:
1031 case RISCV::VMFNE_VV:
1032 case RISCV::VMFLT_VF:
1033 case RISCV::VMFLT_VV:
1034 case RISCV::VMFLE_VF:
1035 case RISCV::VMFLE_VV:
1036 case RISCV::VMFGT_VF:
1037 case RISCV::VMFGE_VF:
1039 case RISCV::VFCVT_XU_F_V:
1040 case RISCV::VFCVT_X_F_V:
1041 case RISCV::VFCVT_RTZ_XU_F_V:
1042 case RISCV::VFCVT_RTZ_X_F_V:
1043 case RISCV::VFCVT_F_XU_V:
1044 case RISCV::VFCVT_F_X_V:
1046 case RISCV::VFWCVT_XU_F_V:
1047 case RISCV::VFWCVT_X_F_V:
1048 case RISCV::VFWCVT_RTZ_XU_F_V:
1049 case RISCV::VFWCVT_RTZ_X_F_V:
1050 case RISCV::VFWCVT_F_XU_V:
1051 case RISCV::VFWCVT_F_X_V:
1052 case RISCV::VFWCVT_F_F_V:
1053 case RISCV::VFWCVTBF16_F_F_V:
1055 case RISCV::VFNCVT_XU_F_W:
1056 case RISCV::VFNCVT_X_F_W:
1057 case RISCV::VFNCVT_RTZ_XU_F_W:
1058 case RISCV::VFNCVT_RTZ_X_F_W:
1059 case RISCV::VFNCVT_F_XU_W:
1060 case RISCV::VFNCVT_F_X_W:
1061 case RISCV::VFNCVT_F_F_W:
1062 case RISCV::VFNCVT_ROD_F_F_W:
1063 case RISCV::VFNCVTBF16_F_F_W:
1074 RISCVVPseudosTable::getPseudoInfo(
MI->getOpcode());
1079 switch (
RVV->BaseInstr) {
1081 case RISCV::VREDAND_VS:
1082 case RISCV::VREDMAX_VS:
1083 case RISCV::VREDMAXU_VS:
1084 case RISCV::VREDMIN_VS:
1085 case RISCV::VREDMINU_VS:
1086 case RISCV::VREDOR_VS:
1087 case RISCV::VREDSUM_VS:
1088 case RISCV::VREDXOR_VS:
1089 case RISCV::VWREDSUM_VS:
1090 case RISCV::VWREDSUMU_VS:
1091 case RISCV::VFREDMAX_VS:
1092 case RISCV::VFREDMIN_VS:
1093 case RISCV::VFREDOSUM_VS:
1094 case RISCV::VFREDUSUM_VS:
1095 case RISCV::VFWREDOSUM_VS:
1096 case RISCV::VFWREDUSUM_VS:
1098 case RISCV::VMV_X_S:
1099 case RISCV::VFMV_F_S:
1109 RISCVVPseudosTable::getPseudoInfo(
MI.getOpcode());
1113 switch (
RVV->BaseInstr) {
1116 case RISCV::VSLIDEDOWN_VI:
1117 case RISCV::VSLIDEDOWN_VX:
1118 case RISCV::VSLIDE1DOWN_VX:
1119 case RISCV::VFSLIDE1DOWN_VF:
1123 case RISCV::VRGATHER_VI:
1124 case RISCV::VRGATHER_VV:
1125 case RISCV::VRGATHER_VX:
1126 case RISCV::VRGATHEREI16_VV:
1134bool RISCVVLOptimizer::isCandidate(
const MachineInstr &
MI)
const {
1138 if (
MI.getNumDefs() != 1)
1153 unsigned PassthruOpIdx =
MI.getNumExplicitDefs();
1155 MI.getOperand(PassthruOpIdx).getReg() != RISCV::NoRegister) {
1157 dbgs() <<
" Not a candidate because it uses non-undef passthru"
1158 " with non-VLMAX VL\n");
1166 LLVM_DEBUG(
dbgs() <<
" Not a candidate because VL is already 1\n");
1170 if (
MI.mayRaiseFPException()) {
1171 LLVM_DEBUG(
dbgs() <<
"Not a candidate because may raise FP exception\n");
1188 LLVM_DEBUG(
dbgs() <<
"Not a candidate due to unsupported instruction\n");
1192 LLVM_DEBUG(
dbgs() <<
"Found a candidate for VL reduction: " <<
MI <<
"\n");
1196std::optional<MachineOperand>
1204 return std::nullopt;
1212 assert(RISCV::VRRegClass.hasSubClassEq(RC) &&
1213 "Expect LMUL 1 register class for vector as scalar operands!");
1214 LLVM_DEBUG(
dbgs() <<
" Used this operand as a scalar operand\n");
1223 "Did not expect X0 VL");
1227std::optional<MachineOperand> RISCVVLOptimizer::checkUsers(
MachineInstr &
MI) {
1232 std::optional<MachineOperand> CommonVL;
1233 for (
auto &UserOp :
MRI->use_operands(
MI.getOperand(0).getReg())) {
1237 LLVM_DEBUG(
dbgs() <<
" Abort because used by unsafe instruction\n");
1238 return std::nullopt;
1243 LLVM_DEBUG(
dbgs() <<
" Abort because user used as tied operand\n");
1244 return std::nullopt;
1247 auto VLOp = getMinimumVLForUser(UserOp);
1249 return std::nullopt;
1257 LLVM_DEBUG(
dbgs() <<
" Abort because cannot determine a common VL\n");
1258 return std::nullopt;
1263 return std::nullopt;
1267 std::optional<OperandInfo> ProducerInfo =
1269 if (!ConsumerInfo || !ProducerInfo) {
1270 LLVM_DEBUG(
dbgs() <<
" Abort due to unknown operand information.\n");
1271 LLVM_DEBUG(
dbgs() <<
" ConsumerInfo is: " << ConsumerInfo <<
"\n");
1272 LLVM_DEBUG(
dbgs() <<
" ProducerInfo is: " << ProducerInfo <<
"\n");
1273 return std::nullopt;
1279 if ((IsVectorOpUsedAsScalarOp &&
1281 (!IsVectorOpUsedAsScalarOp &&
1285 <<
" Abort due to incompatible information for EMUL or EEW.\n");
1286 LLVM_DEBUG(
dbgs() <<
" ConsumerInfo is: " << ConsumerInfo <<
"\n");
1287 LLVM_DEBUG(
dbgs() <<
" ProducerInfo is: " << ProducerInfo <<
"\n");
1288 return std::nullopt;
1295bool RISCVVLOptimizer::tryReduceVL(
MachineInstr &OrigMI) {
1297 Worklist.
insert(&OrigMI);
1299 bool MadeChange =
false;
1300 while (!Worklist.
empty()) {
1307 auto CommonVL = checkUsers(
MI);
1311 assert((CommonVL->isImm() || CommonVL->getReg().isVirtual()) &&
1312 "Expected VL to be an Imm or virtual Reg");
1322 if (CommonVL->isImm()) {
1324 << CommonVL->getImm() <<
" for " <<
MI <<
"\n");
1328 if (!MDT->dominates(VLMI, &
MI))
1331 dbgs() <<
" Reduce VL from " << VLOp <<
" to "
1332 <<
printReg(CommonVL->getReg(),
MRI->getTargetRegisterInfo())
1333 <<
" for " <<
MI <<
"\n");
1342 for (
auto &
Op :
MI.operands()) {
1343 if (!
Op.isReg() || !
Op.isUse() || !
Op.getReg().isVirtual())
1366 MDT = &getAnalysis<MachineDominatorTreeWrapperPass>().getDomTree();
1369 if (!
ST.hasVInstructions())
1372 bool MadeChange =
false;
1379 MadeChange |= tryReduceVL(
MI);
unsigned const MachineRegisterInfo * MRI
MachineInstrBuilder MachineInstrBuilder & DefMI
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
#define LLVM_ATTRIBUTE_UNUSED
static bool isCandidate(const MachineInstr *MI, Register &DefedReg, Register FrameReg)
#define INITIALIZE_PASS_DEPENDENCY(depName)
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
static bool mayReadPastVL(const MachineInstr &MI)
Return true if MI may read elements past VL.
static LLVM_ATTRIBUTE_UNUSED raw_ostream & operator<<(raw_ostream &OS, const OperandInfo &OI)
static unsigned getIntegerExtensionOperandEEW(unsigned Factor, const MachineInstr &MI, const MachineOperand &MO)
Dest has EEW=SEW.
static bool isVectorOpUsedAsScalarOp(MachineOperand &MO)
Return true if MO is a vector operand but is used as a scalar operand.
static std::optional< unsigned > getOperandLog2EEW(const MachineOperand &MO, const MachineRegisterInfo *MRI)
static bool isVectorRegClass(Register R, const MachineRegisterInfo *MRI)
Return true if R is a physical or virtual vector register, false otherwise.
static bool isSupportedInstr(const MachineInstr &MI)
Return true if this optimization should consider MI for VL reduction.
static bool isMaskOperand(const MachineInstr &MI, const MachineOperand &MO, const MachineRegisterInfo *MRI)
Check whether MO is a mask operand of MI.
static std::optional< OperandInfo > getOperandInfo(const MachineOperand &MO, const MachineRegisterInfo *MRI)
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
This file implements a set that has insertion order iteration characteristics.
Represent the analysis usage information of a pass.
AnalysisUsage & addRequired()
void setPreservesCFG()
This function should be called by the pass, iff they do not:
This class represents an Operation in the Expression.
FunctionPass class - This class is used to implement most global optimizations.
Describe properties that are true of each instruction in the target description file.
reverse_iterator rbegin()
Analysis pass which computes a MachineDominatorTree.
DominatorTree Class - Concrete subclass of DominatorTreeBase that is used to compute a normal dominat...
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
virtual bool runOnMachineFunction(MachineFunction &MF)=0
runOnMachineFunction - This method must be overloaded to perform the desired machine code transformat...
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
Representation of each machine instruction.
const MCInstrDesc & getDesc() const
Returns the target instruction descriptor of this MachineInstr.
const MachineOperand & getOperand(unsigned i) const
A description of a memory reference used in the backend.
MachineOperand class - Representation of each machine instruction operand.
unsigned getOperandNo() const
Returns the index of this operand in the instruction that it belongs to.
bool isReg() const
isReg - Tests if this is a MO_Register operand.
bool isImm() const
isImm - Tests if this is a MO_Immediate operand.
void ChangeToImmediate(int64_t ImmVal, unsigned TargetFlags=0)
ChangeToImmediate - Replace this operand with a new immediate operand of the specified value.
void ChangeToRegister(Register Reg, bool isDef, bool isImp=false, bool isKill=false, bool isDead=false, bool isUndef=false, bool isDebug=false)
ChangeToRegister - Replace this operand with a new register operand of the specified value.
MachineInstr * getParent()
getParent - Return the instruction that this operand belongs to.
static MachineOperand CreateImm(int64_t Val)
Register getReg() const
getReg - Returns the register number.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
virtual StringRef getPassName() const
getPassName - Return a nice clean name for a pass.
Wrapper class representing virtual and physical registers.
A vector that has set insertion semantics.
bool empty() const
Determine if the SetVector is empty or not.
bool insert(const value_type &X)
Insert a new element into the SetVector.
value_type pop_back_val()
StringRef - Represent a constant reference to a string, i.e.
const uint8_t TSFlags
Configurable target specific flags.
This class implements an extremely fast bulk output stream that can only output to a stream.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
static bool isTiedPseudo(uint64_t TSFlags)
static unsigned getVLOpNum(const MCInstrDesc &Desc)
static VLMUL getLMul(uint64_t TSFlags)
static bool hasVLOp(uint64_t TSFlags)
static unsigned getSEWOpNum(const MCInstrDesc &Desc)
static bool hasSEWOp(uint64_t TSFlags)
static bool isFirstDefTiedToFirstUse(const MCInstrDesc &Desc)
static bool isVRegClass(uint64_t TSFlags)
static std::pair< unsigned, bool > getEMULEqualsEEWDivSEWTimesLMUL(unsigned Log2EEW, const MachineInstr &MI)
Return EMUL = (EEW / SEW) * LMUL where EEW comes from Log2EEW and LMUL and SEW are from the TSFlags o...
std::pair< unsigned, bool > decodeVLMUL(RISCVII::VLMUL VLMUL)
bool isVLKnownLE(const MachineOperand &LHS, const MachineOperand &RHS)
Given two VL operands, do we know that LHS <= RHS?
static constexpr int64_t VLMaxSentinel
This is an optimization pass for GlobalISel generic memory operations.
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
FunctionPass * createRISCVVLOptimizerPass()
unsigned Log2_32(uint32_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Printable printReg(Register Reg, const TargetRegisterInfo *TRI=nullptr, unsigned SubIdx=0, const MachineRegisterInfo *MRI=nullptr)
Prints virtual and physical registers with or without a TRI instance.
Represents the EMUL and EEW of a MachineOperand.
static bool EEWAreEqual(const OperandInfo &A, const OperandInfo &B)
OperandInfo(std::pair< unsigned, bool > EMUL, unsigned Log2EEW)
OperandInfo(unsigned Log2EEW)
void print(raw_ostream &OS) const
static bool EMULAndEEWAreEqual(const OperandInfo &A, const OperandInfo &B)
OperandInfo(RISCVII::VLMUL EMUL, unsigned Log2EEW)
std::optional< std::pair< unsigned, bool > > EMUL
Description of the encoding of one expression Op.