816 if (builtinID == Builtin::BI__builtin_cpu_is) {
817 cgm.errorNYI(
expr->getSourceRange(),
"__builtin_cpu_is");
818 return mlir::Value{};
820 if (builtinID == Builtin::BI__builtin_cpu_supports) {
821 cgm.errorNYI(
expr->getSourceRange(),
"__builtin_cpu_supports");
822 return mlir::Value{};
824 if (builtinID == Builtin::BI__builtin_cpu_init) {
825 cgm.errorNYI(
expr->getSourceRange(),
"__builtin_cpu_init");
826 return mlir::Value{};
841 unsigned iceArguments = 0;
846 for (
auto [idx, arg] : llvm::enumerate(
expr->arguments()))
850 mlir::Type
voidTy = builder.getVoidTy();
855 case X86::BI_mm_clflush:
856 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
857 "x86.sse2.clflush",
voidTy, ops[0]);
858 case X86::BI_mm_lfence:
859 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
860 "x86.sse2.lfence",
voidTy);
861 case X86::BI_mm_pause:
862 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
863 "x86.sse2.pause",
voidTy);
864 case X86::BI_mm_mfence:
865 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
866 "x86.sse2.mfence",
voidTy);
867 case X86::BI_mm_sfence:
868 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
869 "x86.sse.sfence",
voidTy);
870 case X86::BI_mm_prefetch:
871 case X86::BI_m_prefetch:
872 case X86::BI_m_prefetchw:
875 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
"x86.rdtsc",
876 builder.getUInt64Ty());
877 case X86::BI__builtin_ia32_rdtscp: {
878 mlir::Location loc =
getLoc(
expr->getExprLoc());
879 mlir::Type i64Ty = builder.getUInt64Ty();
880 mlir::Type i32Ty = builder.getUInt32Ty();
881 mlir::Type structTy = builder.getAnonRecordTy({i64Ty, i32Ty});
883 builder.emitIntrinsicCallOp(loc,
"x86.rdtscp", structTy);
886 mlir::Value processorId =
887 cir::ExtractMemberOp::create(builder, loc, i32Ty, result, 1);
892 return cir::ExtractMemberOp::create(builder, loc, i64Ty, result, 0);
894 case X86::BI__builtin_ia32_lzcnt_u16:
895 case X86::BI__builtin_ia32_lzcnt_u32:
896 case X86::BI__builtin_ia32_lzcnt_u64: {
897 mlir::Location loc =
getLoc(
expr->getExprLoc());
898 mlir::Value isZeroPoison = builder.getFalse(loc);
899 return builder.emitIntrinsicCallOp(loc,
"ctlz", ops[0].
getType(),
900 mlir::ValueRange{ops[0], isZeroPoison});
902 case X86::BI__builtin_ia32_tzcnt_u16:
903 case X86::BI__builtin_ia32_tzcnt_u32:
904 case X86::BI__builtin_ia32_tzcnt_u64: {
905 mlir::Location loc =
getLoc(
expr->getExprLoc());
906 mlir::Value isZeroPoison = builder.getFalse(loc);
907 return builder.emitIntrinsicCallOp(loc,
"cttz", ops[0].
getType(),
908 mlir::ValueRange{ops[0], isZeroPoison});
910 case X86::BI__builtin_ia32_undef128:
911 case X86::BI__builtin_ia32_undef256:
912 case X86::BI__builtin_ia32_undef512:
920 case X86::BI__builtin_ia32_vec_ext_v4hi:
921 case X86::BI__builtin_ia32_vec_ext_v16qi:
922 case X86::BI__builtin_ia32_vec_ext_v8hi:
923 case X86::BI__builtin_ia32_vec_ext_v4si:
924 case X86::BI__builtin_ia32_vec_ext_v4sf:
925 case X86::BI__builtin_ia32_vec_ext_v2di:
926 case X86::BI__builtin_ia32_vec_ext_v32qi:
927 case X86::BI__builtin_ia32_vec_ext_v16hi:
928 case X86::BI__builtin_ia32_vec_ext_v8si:
929 case X86::BI__builtin_ia32_vec_ext_v4di: {
933 index &= numElts - 1;
935 cir::ConstantOp indexVal =
940 return cir::VecExtractOp::create(builder,
getLoc(
expr->getExprLoc()),
943 case X86::BI__builtin_ia32_vec_set_v4hi:
944 case X86::BI__builtin_ia32_vec_set_v16qi:
945 case X86::BI__builtin_ia32_vec_set_v8hi:
946 case X86::BI__builtin_ia32_vec_set_v4si:
947 case X86::BI__builtin_ia32_vec_set_v2di:
948 case X86::BI__builtin_ia32_vec_set_v32qi:
949 case X86::BI__builtin_ia32_vec_set_v16hi:
950 case X86::BI__builtin_ia32_vec_set_v8si:
951 case X86::BI__builtin_ia32_vec_set_v4di: {
955 case X86::BI__builtin_ia32_kunpckhi:
957 "x86.avx512.kunpackb", ops);
958 case X86::BI__builtin_ia32_kunpcksi:
960 "x86.avx512.kunpackw", ops);
961 case X86::BI__builtin_ia32_kunpckdi:
963 "x86.avx512.kunpackd", ops);
964 case X86::BI_mm_setcsr:
965 case X86::BI__builtin_ia32_ldmxcsr: {
966 mlir::Location loc =
getLoc(
expr->getExprLoc());
968 builder.createStore(loc, ops[0], tmp);
969 return builder.emitIntrinsicCallOp(loc,
"x86.sse.ldmxcsr",
972 case X86::BI_mm_getcsr:
973 case X86::BI__builtin_ia32_stmxcsr: {
974 mlir::Location loc =
getLoc(
expr->getExprLoc());
976 builder.emitIntrinsicCallOp(loc,
"x86.sse.stmxcsr", builder.getVoidTy(),
978 return builder.createLoad(loc, tmp);
980 case X86::BI__builtin_ia32_xsave:
981 case X86::BI__builtin_ia32_xsave64:
982 case X86::BI__builtin_ia32_xrstor:
983 case X86::BI__builtin_ia32_xrstor64:
984 case X86::BI__builtin_ia32_xsaveopt:
985 case X86::BI__builtin_ia32_xsaveopt64:
986 case X86::BI__builtin_ia32_xrstors:
987 case X86::BI__builtin_ia32_xrstors64:
988 case X86::BI__builtin_ia32_xsavec:
989 case X86::BI__builtin_ia32_xsavec64:
990 case X86::BI__builtin_ia32_xsaves:
991 case X86::BI__builtin_ia32_xsaves64:
992 case X86::BI__builtin_ia32_xsetbv:
993 case X86::BI_xsetbv: {
994 mlir::Location loc =
getLoc(
expr->getExprLoc());
995 StringRef intrinsicName;
998 llvm_unreachable(
"Unexpected builtin");
999 case X86::BI__builtin_ia32_xsave:
1000 intrinsicName =
"x86.xsave";
1002 case X86::BI__builtin_ia32_xsave64:
1003 intrinsicName =
"x86.xsave64";
1005 case X86::BI__builtin_ia32_xrstor:
1006 intrinsicName =
"x86.xrstor";
1008 case X86::BI__builtin_ia32_xrstor64:
1009 intrinsicName =
"x86.xrstor64";
1011 case X86::BI__builtin_ia32_xsaveopt:
1012 intrinsicName =
"x86.xsaveopt";
1014 case X86::BI__builtin_ia32_xsaveopt64:
1015 intrinsicName =
"x86.xsaveopt64";
1017 case X86::BI__builtin_ia32_xrstors:
1018 intrinsicName =
"x86.xrstors";
1020 case X86::BI__builtin_ia32_xrstors64:
1021 intrinsicName =
"x86.xrstors64";
1023 case X86::BI__builtin_ia32_xsavec:
1024 intrinsicName =
"x86.xsavec";
1026 case X86::BI__builtin_ia32_xsavec64:
1027 intrinsicName =
"x86.xsavec64";
1029 case X86::BI__builtin_ia32_xsaves:
1030 intrinsicName =
"x86.xsaves";
1032 case X86::BI__builtin_ia32_xsaves64:
1033 intrinsicName =
"x86.xsaves64";
1035 case X86::BI__builtin_ia32_xsetbv:
1036 case X86::BI_xsetbv:
1037 intrinsicName =
"x86.xsetbv";
1045 mlir::Type i32Ty = builder.getSInt32Ty();
1048 cir::ConstantOp shift32 = builder.getSInt64(32, loc);
1049 mlir::Value mhi = builder.createShift(loc, ops[1], shift32.getResult(),
1051 mhi = builder.createIntCast(mhi, i32Ty);
1054 mlir::Value mlo = builder.createIntCast(ops[1], i32Ty);
1056 return builder.emitIntrinsicCallOp(loc, intrinsicName,
voidTy,
1057 mlir::ValueRange{ops[0], mhi, mlo});
1059 case X86::BI__builtin_ia32_xgetbv:
1060 case X86::BI_xgetbv:
1063 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
"x86.xgetbv",
1064 builder.getUInt64Ty(), ops[0]);
1065 case X86::BI__builtin_ia32_storedqudi128_mask:
1066 case X86::BI__builtin_ia32_storedqusi128_mask:
1067 case X86::BI__builtin_ia32_storedquhi128_mask:
1068 case X86::BI__builtin_ia32_storedquqi128_mask:
1069 case X86::BI__builtin_ia32_storeupd128_mask:
1070 case X86::BI__builtin_ia32_storeups128_mask:
1071 case X86::BI__builtin_ia32_storedqudi256_mask:
1072 case X86::BI__builtin_ia32_storedqusi256_mask:
1073 case X86::BI__builtin_ia32_storedquhi256_mask:
1074 case X86::BI__builtin_ia32_storedquqi256_mask:
1075 case X86::BI__builtin_ia32_storeupd256_mask:
1076 case X86::BI__builtin_ia32_storeups256_mask:
1077 case X86::BI__builtin_ia32_storedqudi512_mask:
1078 case X86::BI__builtin_ia32_storedqusi512_mask:
1079 case X86::BI__builtin_ia32_storedquhi512_mask:
1080 case X86::BI__builtin_ia32_storedquqi512_mask:
1081 case X86::BI__builtin_ia32_storeupd512_mask:
1082 case X86::BI__builtin_ia32_storeups512_mask:
1083 case X86::BI__builtin_ia32_storesbf16128_mask:
1084 case X86::BI__builtin_ia32_storesh128_mask:
1085 case X86::BI__builtin_ia32_storess128_mask:
1086 case X86::BI__builtin_ia32_storesd128_mask:
1087 cgm.errorNYI(
expr->getSourceRange(),
1088 std::string(
"unimplemented x86 builtin call: ") +
1089 getContext().BuiltinInfo.getName(builtinID));
1090 return mlir::Value{};
1091 case X86::BI__builtin_ia32_cvtmask2b128:
1092 case X86::BI__builtin_ia32_cvtmask2b256:
1093 case X86::BI__builtin_ia32_cvtmask2b512:
1094 case X86::BI__builtin_ia32_cvtmask2w128:
1095 case X86::BI__builtin_ia32_cvtmask2w256:
1096 case X86::BI__builtin_ia32_cvtmask2w512:
1097 case X86::BI__builtin_ia32_cvtmask2d128:
1098 case X86::BI__builtin_ia32_cvtmask2d256:
1099 case X86::BI__builtin_ia32_cvtmask2d512:
1100 case X86::BI__builtin_ia32_cvtmask2q128:
1101 case X86::BI__builtin_ia32_cvtmask2q256:
1102 case X86::BI__builtin_ia32_cvtmask2q512:
1106 case X86::BI__builtin_ia32_cvtb2mask128:
1107 case X86::BI__builtin_ia32_cvtb2mask256:
1108 case X86::BI__builtin_ia32_cvtb2mask512:
1109 case X86::BI__builtin_ia32_cvtw2mask128:
1110 case X86::BI__builtin_ia32_cvtw2mask256:
1111 case X86::BI__builtin_ia32_cvtw2mask512:
1112 case X86::BI__builtin_ia32_cvtd2mask128:
1113 case X86::BI__builtin_ia32_cvtd2mask256:
1114 case X86::BI__builtin_ia32_cvtd2mask512:
1115 case X86::BI__builtin_ia32_cvtq2mask128:
1116 case X86::BI__builtin_ia32_cvtq2mask256:
1117 case X86::BI__builtin_ia32_cvtq2mask512:
1120 case X86::BI__builtin_ia32_cvtdq2ps512_mask:
1121 case X86::BI__builtin_ia32_cvtqq2ps512_mask:
1122 case X86::BI__builtin_ia32_cvtqq2pd512_mask:
1123 case X86::BI__builtin_ia32_vcvtw2ph512_mask:
1124 case X86::BI__builtin_ia32_vcvtdq2ph512_mask:
1125 case X86::BI__builtin_ia32_vcvtqq2ph512_mask:
1126 case X86::BI__builtin_ia32_cvtudq2ps512_mask:
1127 case X86::BI__builtin_ia32_cvtuqq2ps512_mask:
1128 case X86::BI__builtin_ia32_cvtuqq2pd512_mask:
1129 case X86::BI__builtin_ia32_vcvtuw2ph512_mask:
1130 case X86::BI__builtin_ia32_vcvtudq2ph512_mask:
1131 case X86::BI__builtin_ia32_vcvtuqq2ph512_mask:
1132 case X86::BI__builtin_ia32_vfmaddsh3_mask:
1133 case X86::BI__builtin_ia32_vfmaddss3_mask:
1134 case X86::BI__builtin_ia32_vfmaddsd3_mask:
1135 case X86::BI__builtin_ia32_vfmaddsh3_maskz:
1136 case X86::BI__builtin_ia32_vfmaddss3_maskz:
1137 case X86::BI__builtin_ia32_vfmaddsd3_maskz:
1138 case X86::BI__builtin_ia32_vfmaddsh3_mask3:
1139 case X86::BI__builtin_ia32_vfmaddss3_mask3:
1140 case X86::BI__builtin_ia32_vfmaddsd3_mask3:
1141 case X86::BI__builtin_ia32_vfmsubsh3_mask3:
1142 case X86::BI__builtin_ia32_vfmsubss3_mask3:
1143 case X86::BI__builtin_ia32_vfmsubsd3_mask3:
1144 case X86::BI__builtin_ia32_vfmaddph512_mask:
1145 case X86::BI__builtin_ia32_vfmaddph512_maskz:
1146 case X86::BI__builtin_ia32_vfmaddph512_mask3:
1147 case X86::BI__builtin_ia32_vfmaddps512_mask:
1148 case X86::BI__builtin_ia32_vfmaddps512_maskz:
1149 case X86::BI__builtin_ia32_vfmaddps512_mask3:
1150 case X86::BI__builtin_ia32_vfmsubps512_mask3:
1151 case X86::BI__builtin_ia32_vfmaddpd512_mask:
1152 case X86::BI__builtin_ia32_vfmaddpd512_maskz:
1153 case X86::BI__builtin_ia32_vfmaddpd512_mask3:
1154 case X86::BI__builtin_ia32_vfmsubpd512_mask3:
1155 case X86::BI__builtin_ia32_vfmsubph512_mask3:
1156 case X86::BI__builtin_ia32_vfmaddsubph512_mask:
1157 case X86::BI__builtin_ia32_vfmaddsubph512_maskz:
1158 case X86::BI__builtin_ia32_vfmaddsubph512_mask3:
1159 case X86::BI__builtin_ia32_vfmsubaddph512_mask3:
1160 case X86::BI__builtin_ia32_vfmaddsubps512_mask:
1161 case X86::BI__builtin_ia32_vfmaddsubps512_maskz:
1162 case X86::BI__builtin_ia32_vfmaddsubps512_mask3:
1163 case X86::BI__builtin_ia32_vfmsubaddps512_mask3:
1164 case X86::BI__builtin_ia32_vfmaddsubpd512_mask:
1165 case X86::BI__builtin_ia32_vfmaddsubpd512_maskz:
1166 case X86::BI__builtin_ia32_vfmaddsubpd512_mask3:
1167 case X86::BI__builtin_ia32_vfmsubaddpd512_mask3:
1168 case X86::BI__builtin_ia32_movdqa32store128_mask:
1169 case X86::BI__builtin_ia32_movdqa64store128_mask:
1170 case X86::BI__builtin_ia32_storeaps128_mask:
1171 case X86::BI__builtin_ia32_storeapd128_mask:
1172 case X86::BI__builtin_ia32_movdqa32store256_mask:
1173 case X86::BI__builtin_ia32_movdqa64store256_mask:
1174 case X86::BI__builtin_ia32_storeaps256_mask:
1175 case X86::BI__builtin_ia32_storeapd256_mask:
1176 case X86::BI__builtin_ia32_movdqa32store512_mask:
1177 case X86::BI__builtin_ia32_movdqa64store512_mask:
1178 case X86::BI__builtin_ia32_storeaps512_mask:
1179 case X86::BI__builtin_ia32_storeapd512_mask:
1180 cgm.errorNYI(
expr->getSourceRange(),
1181 std::string(
"unimplemented X86 builtin call: ") +
1182 getContext().BuiltinInfo.getName(builtinID));
1185 case X86::BI__builtin_ia32_loadups128_mask:
1186 case X86::BI__builtin_ia32_loadups256_mask:
1187 case X86::BI__builtin_ia32_loadups512_mask:
1188 case X86::BI__builtin_ia32_loadupd128_mask:
1189 case X86::BI__builtin_ia32_loadupd256_mask:
1190 case X86::BI__builtin_ia32_loadupd512_mask:
1191 case X86::BI__builtin_ia32_loaddquqi128_mask:
1192 case X86::BI__builtin_ia32_loaddquqi256_mask:
1193 case X86::BI__builtin_ia32_loaddquqi512_mask:
1194 case X86::BI__builtin_ia32_loaddquhi128_mask:
1195 case X86::BI__builtin_ia32_loaddquhi256_mask:
1196 case X86::BI__builtin_ia32_loaddquhi512_mask:
1197 case X86::BI__builtin_ia32_loaddqusi128_mask:
1198 case X86::BI__builtin_ia32_loaddqusi256_mask:
1199 case X86::BI__builtin_ia32_loaddqusi512_mask:
1200 case X86::BI__builtin_ia32_loaddqudi128_mask:
1201 case X86::BI__builtin_ia32_loaddqudi256_mask:
1202 case X86::BI__builtin_ia32_loaddqudi512_mask:
1203 case X86::BI__builtin_ia32_loadsbf16128_mask:
1204 case X86::BI__builtin_ia32_loadsh128_mask:
1205 case X86::BI__builtin_ia32_loadss128_mask:
1206 case X86::BI__builtin_ia32_loadsd128_mask:
1210 case X86::BI__builtin_ia32_loadaps128_mask:
1211 case X86::BI__builtin_ia32_loadaps256_mask:
1212 case X86::BI__builtin_ia32_loadaps512_mask:
1213 case X86::BI__builtin_ia32_loadapd128_mask:
1214 case X86::BI__builtin_ia32_loadapd256_mask:
1215 case X86::BI__builtin_ia32_loadapd512_mask:
1216 case X86::BI__builtin_ia32_movdqa32load128_mask:
1217 case X86::BI__builtin_ia32_movdqa32load256_mask:
1218 case X86::BI__builtin_ia32_movdqa32load512_mask:
1219 case X86::BI__builtin_ia32_movdqa64load128_mask:
1220 case X86::BI__builtin_ia32_movdqa64load256_mask:
1221 case X86::BI__builtin_ia32_movdqa64load512_mask:
1225 .getTypeAlignInChars(
expr->getArg(1)->getType())
1229 case X86::BI__builtin_ia32_expandloaddf128_mask:
1230 case X86::BI__builtin_ia32_expandloaddf256_mask:
1231 case X86::BI__builtin_ia32_expandloaddf512_mask:
1232 case X86::BI__builtin_ia32_expandloadsf128_mask:
1233 case X86::BI__builtin_ia32_expandloadsf256_mask:
1234 case X86::BI__builtin_ia32_expandloadsf512_mask:
1235 case X86::BI__builtin_ia32_expandloaddi128_mask:
1236 case X86::BI__builtin_ia32_expandloaddi256_mask:
1237 case X86::BI__builtin_ia32_expandloaddi512_mask:
1238 case X86::BI__builtin_ia32_expandloadsi128_mask:
1239 case X86::BI__builtin_ia32_expandloadsi256_mask:
1240 case X86::BI__builtin_ia32_expandloadsi512_mask:
1241 case X86::BI__builtin_ia32_expandloadhi128_mask:
1242 case X86::BI__builtin_ia32_expandloadhi256_mask:
1243 case X86::BI__builtin_ia32_expandloadhi512_mask:
1244 case X86::BI__builtin_ia32_expandloadqi128_mask:
1245 case X86::BI__builtin_ia32_expandloadqi256_mask:
1246 case X86::BI__builtin_ia32_expandloadqi512_mask: {
1247 cgm.errorNYI(
expr->getSourceRange(),
1248 std::string(
"unimplemented X86 builtin call: ") +
1249 getContext().BuiltinInfo.getName(builtinID));
1252 case X86::BI__builtin_ia32_compressstoredf128_mask:
1253 case X86::BI__builtin_ia32_compressstoredf256_mask:
1254 case X86::BI__builtin_ia32_compressstoredf512_mask:
1255 case X86::BI__builtin_ia32_compressstoresf128_mask:
1256 case X86::BI__builtin_ia32_compressstoresf256_mask:
1257 case X86::BI__builtin_ia32_compressstoresf512_mask:
1258 case X86::BI__builtin_ia32_compressstoredi128_mask:
1259 case X86::BI__builtin_ia32_compressstoredi256_mask:
1260 case X86::BI__builtin_ia32_compressstoredi512_mask:
1261 case X86::BI__builtin_ia32_compressstoresi128_mask:
1262 case X86::BI__builtin_ia32_compressstoresi256_mask:
1263 case X86::BI__builtin_ia32_compressstoresi512_mask:
1264 case X86::BI__builtin_ia32_compressstorehi128_mask:
1265 case X86::BI__builtin_ia32_compressstorehi256_mask:
1266 case X86::BI__builtin_ia32_compressstorehi512_mask:
1267 case X86::BI__builtin_ia32_compressstoreqi128_mask:
1268 case X86::BI__builtin_ia32_compressstoreqi256_mask:
1269 case X86::BI__builtin_ia32_compressstoreqi512_mask:
1271 case X86::BI__builtin_ia32_expanddf128_mask:
1272 case X86::BI__builtin_ia32_expanddf256_mask:
1273 case X86::BI__builtin_ia32_expanddf512_mask:
1274 case X86::BI__builtin_ia32_expandsf128_mask:
1275 case X86::BI__builtin_ia32_expandsf256_mask:
1276 case X86::BI__builtin_ia32_expandsf512_mask:
1277 case X86::BI__builtin_ia32_expanddi128_mask:
1278 case X86::BI__builtin_ia32_expanddi256_mask:
1279 case X86::BI__builtin_ia32_expanddi512_mask:
1280 case X86::BI__builtin_ia32_expandsi128_mask:
1281 case X86::BI__builtin_ia32_expandsi256_mask:
1282 case X86::BI__builtin_ia32_expandsi512_mask:
1283 case X86::BI__builtin_ia32_expandhi128_mask:
1284 case X86::BI__builtin_ia32_expandhi256_mask:
1285 case X86::BI__builtin_ia32_expandhi512_mask:
1286 case X86::BI__builtin_ia32_expandqi128_mask:
1287 case X86::BI__builtin_ia32_expandqi256_mask:
1288 case X86::BI__builtin_ia32_expandqi512_mask: {
1289 mlir::Location loc =
getLoc(
expr->getExprLoc());
1291 "x86.avx512.mask.expand");
1293 case X86::BI__builtin_ia32_compressdf128_mask:
1294 case X86::BI__builtin_ia32_compressdf256_mask:
1295 case X86::BI__builtin_ia32_compressdf512_mask:
1296 case X86::BI__builtin_ia32_compresssf128_mask:
1297 case X86::BI__builtin_ia32_compresssf256_mask:
1298 case X86::BI__builtin_ia32_compresssf512_mask:
1299 case X86::BI__builtin_ia32_compressdi128_mask:
1300 case X86::BI__builtin_ia32_compressdi256_mask:
1301 case X86::BI__builtin_ia32_compressdi512_mask:
1302 case X86::BI__builtin_ia32_compresssi128_mask:
1303 case X86::BI__builtin_ia32_compresssi256_mask:
1304 case X86::BI__builtin_ia32_compresssi512_mask:
1305 case X86::BI__builtin_ia32_compresshi128_mask:
1306 case X86::BI__builtin_ia32_compresshi256_mask:
1307 case X86::BI__builtin_ia32_compresshi512_mask:
1308 case X86::BI__builtin_ia32_compressqi128_mask:
1309 case X86::BI__builtin_ia32_compressqi256_mask:
1310 case X86::BI__builtin_ia32_compressqi512_mask: {
1311 mlir::Location loc =
getLoc(
expr->getExprLoc());
1313 "x86.avx512.mask.compress");
1315 case X86::BI__builtin_ia32_gather3div2df:
1316 case X86::BI__builtin_ia32_gather3div2di:
1317 case X86::BI__builtin_ia32_gather3div4df:
1318 case X86::BI__builtin_ia32_gather3div4di:
1319 case X86::BI__builtin_ia32_gather3div4sf:
1320 case X86::BI__builtin_ia32_gather3div4si:
1321 case X86::BI__builtin_ia32_gather3div8sf:
1322 case X86::BI__builtin_ia32_gather3div8si:
1323 case X86::BI__builtin_ia32_gather3siv2df:
1324 case X86::BI__builtin_ia32_gather3siv2di:
1325 case X86::BI__builtin_ia32_gather3siv4df:
1326 case X86::BI__builtin_ia32_gather3siv4di:
1327 case X86::BI__builtin_ia32_gather3siv4sf:
1328 case X86::BI__builtin_ia32_gather3siv4si:
1329 case X86::BI__builtin_ia32_gather3siv8sf:
1330 case X86::BI__builtin_ia32_gather3siv8si:
1331 case X86::BI__builtin_ia32_gathersiv8df:
1332 case X86::BI__builtin_ia32_gathersiv16sf:
1333 case X86::BI__builtin_ia32_gatherdiv8df:
1334 case X86::BI__builtin_ia32_gatherdiv16sf:
1335 case X86::BI__builtin_ia32_gathersiv8di:
1336 case X86::BI__builtin_ia32_gathersiv16si:
1337 case X86::BI__builtin_ia32_gatherdiv8di:
1338 case X86::BI__builtin_ia32_gatherdiv16si: {
1339 StringRef intrinsicName;
1340 switch (builtinID) {
1342 llvm_unreachable(
"Unexpected builtin");
1343 case X86::BI__builtin_ia32_gather3div2df:
1344 intrinsicName =
"x86.avx512.mask.gather3div2.df";
1346 case X86::BI__builtin_ia32_gather3div2di:
1347 intrinsicName =
"x86.avx512.mask.gather3div2.di";
1349 case X86::BI__builtin_ia32_gather3div4df:
1350 intrinsicName =
"x86.avx512.mask.gather3div4.df";
1352 case X86::BI__builtin_ia32_gather3div4di:
1353 intrinsicName =
"x86.avx512.mask.gather3div4.di";
1355 case X86::BI__builtin_ia32_gather3div4sf:
1356 intrinsicName =
"x86.avx512.mask.gather3div4.sf";
1358 case X86::BI__builtin_ia32_gather3div4si:
1359 intrinsicName =
"x86.avx512.mask.gather3div4.si";
1361 case X86::BI__builtin_ia32_gather3div8sf:
1362 intrinsicName =
"x86.avx512.mask.gather3div8.sf";
1364 case X86::BI__builtin_ia32_gather3div8si:
1365 intrinsicName =
"x86.avx512.mask.gather3div8.si";
1367 case X86::BI__builtin_ia32_gather3siv2df:
1368 intrinsicName =
"x86.avx512.mask.gather3siv2.df";
1370 case X86::BI__builtin_ia32_gather3siv2di:
1371 intrinsicName =
"x86.avx512.mask.gather3siv2.di";
1373 case X86::BI__builtin_ia32_gather3siv4df:
1374 intrinsicName =
"x86.avx512.mask.gather3siv4.df";
1376 case X86::BI__builtin_ia32_gather3siv4di:
1377 intrinsicName =
"x86.avx512.mask.gather3siv4.di";
1379 case X86::BI__builtin_ia32_gather3siv4sf:
1380 intrinsicName =
"x86.avx512.mask.gather3siv4.sf";
1382 case X86::BI__builtin_ia32_gather3siv4si:
1383 intrinsicName =
"x86.avx512.mask.gather3siv4.si";
1385 case X86::BI__builtin_ia32_gather3siv8sf:
1386 intrinsicName =
"x86.avx512.mask.gather3siv8.sf";
1388 case X86::BI__builtin_ia32_gather3siv8si:
1389 intrinsicName =
"x86.avx512.mask.gather3siv8.si";
1391 case X86::BI__builtin_ia32_gathersiv8df:
1392 intrinsicName =
"x86.avx512.mask.gather.dpd.512";
1394 case X86::BI__builtin_ia32_gathersiv16sf:
1395 intrinsicName =
"x86.avx512.mask.gather.dps.512";
1397 case X86::BI__builtin_ia32_gatherdiv8df:
1398 intrinsicName =
"x86.avx512.mask.gather.qpd.512";
1400 case X86::BI__builtin_ia32_gatherdiv16sf:
1401 intrinsicName =
"x86.avx512.mask.gather.qps.512";
1403 case X86::BI__builtin_ia32_gathersiv8di:
1404 intrinsicName =
"x86.avx512.mask.gather.dpq.512";
1406 case X86::BI__builtin_ia32_gathersiv16si:
1407 intrinsicName =
"x86.avx512.mask.gather.dpi.512";
1409 case X86::BI__builtin_ia32_gatherdiv8di:
1410 intrinsicName =
"x86.avx512.mask.gather.qpq.512";
1412 case X86::BI__builtin_ia32_gatherdiv16si:
1413 intrinsicName =
"x86.avx512.mask.gather.qpi.512";
1417 mlir::Location loc =
getLoc(
expr->getExprLoc());
1422 return builder.emitIntrinsicCallOp(loc, intrinsicName,
1425 case X86::BI__builtin_ia32_scattersiv8df:
1426 case X86::BI__builtin_ia32_scattersiv16sf:
1427 case X86::BI__builtin_ia32_scatterdiv8df:
1428 case X86::BI__builtin_ia32_scatterdiv16sf:
1429 case X86::BI__builtin_ia32_scattersiv8di:
1430 case X86::BI__builtin_ia32_scattersiv16si:
1431 case X86::BI__builtin_ia32_scatterdiv8di:
1432 case X86::BI__builtin_ia32_scatterdiv16si:
1433 case X86::BI__builtin_ia32_scatterdiv2df:
1434 case X86::BI__builtin_ia32_scatterdiv2di:
1435 case X86::BI__builtin_ia32_scatterdiv4df:
1436 case X86::BI__builtin_ia32_scatterdiv4di:
1437 case X86::BI__builtin_ia32_scatterdiv4sf:
1438 case X86::BI__builtin_ia32_scatterdiv4si:
1439 case X86::BI__builtin_ia32_scatterdiv8sf:
1440 case X86::BI__builtin_ia32_scatterdiv8si:
1441 case X86::BI__builtin_ia32_scattersiv2df:
1442 case X86::BI__builtin_ia32_scattersiv2di:
1443 case X86::BI__builtin_ia32_scattersiv4df:
1444 case X86::BI__builtin_ia32_scattersiv4di:
1445 case X86::BI__builtin_ia32_scattersiv4sf:
1446 case X86::BI__builtin_ia32_scattersiv4si:
1447 case X86::BI__builtin_ia32_scattersiv8sf:
1448 case X86::BI__builtin_ia32_scattersiv8si: {
1449 llvm::StringRef intrinsicName;
1450 switch (builtinID) {
1452 llvm_unreachable(
"Unexpected builtin");
1453 case X86::BI__builtin_ia32_scattersiv8df:
1454 intrinsicName =
"x86.avx512.mask.scatter.dpd.512";
1456 case X86::BI__builtin_ia32_scattersiv16sf:
1457 intrinsicName =
"x86.avx512.mask.scatter.dps.512";
1459 case X86::BI__builtin_ia32_scatterdiv8df:
1460 intrinsicName =
"x86.avx512.mask.scatter.qpd.512";
1462 case X86::BI__builtin_ia32_scatterdiv16sf:
1463 intrinsicName =
"x86.avx512.mask.scatter.qps.512";
1465 case X86::BI__builtin_ia32_scattersiv8di:
1466 intrinsicName =
"x86.avx512.mask.scatter.dpq.512";
1468 case X86::BI__builtin_ia32_scattersiv16si:
1469 intrinsicName =
"x86.avx512.mask.scatter.dpi.512";
1471 case X86::BI__builtin_ia32_scatterdiv8di:
1472 intrinsicName =
"x86.avx512.mask.scatter.qpq.512";
1474 case X86::BI__builtin_ia32_scatterdiv16si:
1475 intrinsicName =
"x86.avx512.mask.scatter.qpi.512";
1477 case X86::BI__builtin_ia32_scatterdiv2df:
1478 intrinsicName =
"x86.avx512.mask.scatterdiv2.df";
1480 case X86::BI__builtin_ia32_scatterdiv2di:
1481 intrinsicName =
"x86.avx512.mask.scatterdiv2.di";
1483 case X86::BI__builtin_ia32_scatterdiv4df:
1484 intrinsicName =
"x86.avx512.mask.scatterdiv4.df";
1486 case X86::BI__builtin_ia32_scatterdiv4di:
1487 intrinsicName =
"x86.avx512.mask.scatterdiv4.di";
1489 case X86::BI__builtin_ia32_scatterdiv4sf:
1490 intrinsicName =
"x86.avx512.mask.scatterdiv4.sf";
1492 case X86::BI__builtin_ia32_scatterdiv4si:
1493 intrinsicName =
"x86.avx512.mask.scatterdiv4.si";
1495 case X86::BI__builtin_ia32_scatterdiv8sf:
1496 intrinsicName =
"x86.avx512.mask.scatterdiv8.sf";
1498 case X86::BI__builtin_ia32_scatterdiv8si:
1499 intrinsicName =
"x86.avx512.mask.scatterdiv8.si";
1501 case X86::BI__builtin_ia32_scattersiv2df:
1502 intrinsicName =
"x86.avx512.mask.scattersiv2.df";
1504 case X86::BI__builtin_ia32_scattersiv2di:
1505 intrinsicName =
"x86.avx512.mask.scattersiv2.di";
1507 case X86::BI__builtin_ia32_scattersiv4df:
1508 intrinsicName =
"x86.avx512.mask.scattersiv4.df";
1510 case X86::BI__builtin_ia32_scattersiv4di:
1511 intrinsicName =
"x86.avx512.mask.scattersiv4.di";
1513 case X86::BI__builtin_ia32_scattersiv4sf:
1514 intrinsicName =
"x86.avx512.mask.scattersiv4.sf";
1516 case X86::BI__builtin_ia32_scattersiv4si:
1517 intrinsicName =
"x86.avx512.mask.scattersiv4.si";
1519 case X86::BI__builtin_ia32_scattersiv8sf:
1520 intrinsicName =
"x86.avx512.mask.scattersiv8.sf";
1522 case X86::BI__builtin_ia32_scattersiv8si:
1523 intrinsicName =
"x86.avx512.mask.scattersiv8.si";
1527 mlir::Location loc =
getLoc(
expr->getExprLoc());
1533 return builder.emitIntrinsicCallOp(loc, intrinsicName,
1536 case X86::BI__builtin_ia32_vextractf128_pd256:
1537 case X86::BI__builtin_ia32_vextractf128_ps256:
1538 case X86::BI__builtin_ia32_vextractf128_si256:
1539 case X86::BI__builtin_ia32_extract128i256:
1540 case X86::BI__builtin_ia32_extractf64x4_mask:
1541 case X86::BI__builtin_ia32_extractf32x4_mask:
1542 case X86::BI__builtin_ia32_extracti64x4_mask:
1543 case X86::BI__builtin_ia32_extracti32x4_mask:
1544 case X86::BI__builtin_ia32_extractf32x8_mask:
1545 case X86::BI__builtin_ia32_extracti32x8_mask:
1546 case X86::BI__builtin_ia32_extractf32x4_256_mask:
1547 case X86::BI__builtin_ia32_extracti32x4_256_mask:
1548 case X86::BI__builtin_ia32_extractf64x2_256_mask:
1549 case X86::BI__builtin_ia32_extracti64x2_256_mask:
1550 case X86::BI__builtin_ia32_extractf64x2_512_mask:
1551 case X86::BI__builtin_ia32_extracti64x2_512_mask: {
1552 mlir::Location loc =
getLoc(
expr->getExprLoc());
1554 unsigned numElts = dstTy.getSize();
1556 unsigned subVectors = srcNumElts / numElts;
1557 assert(llvm::isPowerOf2_32(subVectors) &&
"Expected power of 2 subvectors");
1559 ops[1].getDefiningOp<cir::ConstantOp>().getIntValue().getZExtValue();
1561 index &= subVectors - 1;
1564 int64_t indices[16];
1565 std::iota(indices, indices + numElts,
index);
1567 mlir::Value poison =
1568 builder.getConstant(loc, cir::PoisonAttr::get(ops[0].
getType()));
1569 mlir::Value res = builder.createVecShuffle(loc, ops[0], poison,
1571 if (ops.size() == 4)
1576 case X86::BI__builtin_ia32_vinsertf128_pd256:
1577 case X86::BI__builtin_ia32_vinsertf128_ps256:
1578 case X86::BI__builtin_ia32_vinsertf128_si256:
1579 case X86::BI__builtin_ia32_insert128i256:
1580 case X86::BI__builtin_ia32_insertf64x4:
1581 case X86::BI__builtin_ia32_insertf32x4:
1582 case X86::BI__builtin_ia32_inserti64x4:
1583 case X86::BI__builtin_ia32_inserti32x4:
1584 case X86::BI__builtin_ia32_insertf32x8:
1585 case X86::BI__builtin_ia32_inserti32x8:
1586 case X86::BI__builtin_ia32_insertf32x4_256:
1587 case X86::BI__builtin_ia32_inserti32x4_256:
1588 case X86::BI__builtin_ia32_insertf64x2_256:
1589 case X86::BI__builtin_ia32_inserti64x2_256:
1590 case X86::BI__builtin_ia32_insertf64x2_512:
1591 case X86::BI__builtin_ia32_inserti64x2_512: {
1594 unsigned subVectors = dstNumElts / srcNumElts;
1595 assert(llvm::isPowerOf2_32(subVectors) &&
"Expected power of 2 subvectors");
1596 assert(dstNumElts <= 16);
1599 index &= subVectors - 1;
1600 index *= srcNumElts;
1603 for (
unsigned i = 0; i != dstNumElts; ++i)
1604 mask[i] = (i >= srcNumElts) ? srcNumElts + (i % srcNumElts) : i;
1607 builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[1], mask);
1609 for (
unsigned i = 0; i != dstNumElts; ++i) {
1611 mask[i] = (i -
index) + dstNumElts;
1616 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[0], op1,
1619 case X86::BI__builtin_ia32_pmovqd512_mask:
1620 case X86::BI__builtin_ia32_pmovwb512_mask: {
1626 case X86::BI__builtin_ia32_pblendw128:
1627 case X86::BI__builtin_ia32_blendpd:
1628 case X86::BI__builtin_ia32_blendps:
1629 case X86::BI__builtin_ia32_blendpd256:
1630 case X86::BI__builtin_ia32_blendps256:
1631 case X86::BI__builtin_ia32_pblendw256:
1632 case X86::BI__builtin_ia32_pblendd128:
1633 case X86::BI__builtin_ia32_pblendd256: {
1640 mlir::Type i32Ty = builder.getSInt32Ty();
1641 for (
unsigned i = 0; i != numElts; ++i)
1643 cir::IntAttr::get(i32Ty, ((imm >> (i % 8)) & 0x1) ? numElts + i : i));
1645 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[0], ops[1],
1648 case X86::BI__builtin_ia32_pshuflw:
1649 case X86::BI__builtin_ia32_pshuflw256:
1650 case X86::BI__builtin_ia32_pshuflw512:
1653 case X86::BI__builtin_ia32_pshufhw:
1654 case X86::BI__builtin_ia32_pshufhw256:
1655 case X86::BI__builtin_ia32_pshufhw512:
1658 case X86::BI__builtin_ia32_pshufd:
1659 case X86::BI__builtin_ia32_pshufd256:
1660 case X86::BI__builtin_ia32_pshufd512:
1661 case X86::BI__builtin_ia32_vpermilpd:
1662 case X86::BI__builtin_ia32_vpermilps:
1663 case X86::BI__builtin_ia32_vpermilpd256:
1664 case X86::BI__builtin_ia32_vpermilps256:
1665 case X86::BI__builtin_ia32_vpermilpd512:
1666 case X86::BI__builtin_ia32_vpermilps512: {
1672 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[0], mask);
1674 case X86::BI__builtin_ia32_shufpd:
1675 case X86::BI__builtin_ia32_shufpd256:
1676 case X86::BI__builtin_ia32_shufpd512:
1677 case X86::BI__builtin_ia32_shufps:
1678 case X86::BI__builtin_ia32_shufps256:
1679 case X86::BI__builtin_ia32_shufps512: {
1685 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[0], ops[1],
1688 case X86::BI__builtin_ia32_permdi256:
1689 case X86::BI__builtin_ia32_permdf256:
1690 case X86::BI__builtin_ia32_permdi512:
1691 case X86::BI__builtin_ia32_permdf512: {
1693 ops[1].getDefiningOp<cir::ConstantOp>().getIntValue().getZExtValue();
1699 for (
unsigned l = 0; l != numElts; l += 4)
1700 for (
unsigned i = 0; i != 4; ++i)
1701 Indices[l + i] = l + ((imm >> (2 * i)) & 0x3);
1703 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[0],
1706 case X86::BI__builtin_ia32_palignr128:
1707 case X86::BI__builtin_ia32_palignr256:
1708 case X86::BI__builtin_ia32_palignr512: {
1712 assert(numElts % 16 == 0);
1722 if (shiftVal > 16) {
1729 int64_t indices[64];
1731 for (
unsigned l = 0; l != numElts; l += 16) {
1732 for (
unsigned i = 0; i != 16; ++i) {
1733 uint32_t idx = shiftVal + i;
1735 idx += numElts - 16;
1736 indices[l + i] = l + idx;
1740 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[1], ops[0],
1743 case X86::BI__builtin_ia32_alignd128:
1744 case X86::BI__builtin_ia32_alignd256:
1745 case X86::BI__builtin_ia32_alignd512:
1746 case X86::BI__builtin_ia32_alignq128:
1747 case X86::BI__builtin_ia32_alignq256:
1748 case X86::BI__builtin_ia32_alignq512: {
1751 ops[2].getDefiningOp<cir::ConstantOp>().getIntValue().getZExtValue() &
1755 shiftVal &= numElts - 1;
1758 mlir::Type i32Ty = builder.getSInt32Ty();
1759 for (
unsigned i = 0; i != numElts; ++i)
1760 indices.push_back(cir::IntAttr::get(i32Ty, i + shiftVal));
1762 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[0], ops[1],
1765 case X86::BI__builtin_ia32_shuf_f32x4_256:
1766 case X86::BI__builtin_ia32_shuf_f64x2_256:
1767 case X86::BI__builtin_ia32_shuf_i32x4_256:
1768 case X86::BI__builtin_ia32_shuf_i64x2_256:
1769 case X86::BI__builtin_ia32_shuf_f32x4:
1770 case X86::BI__builtin_ia32_shuf_f64x2:
1771 case X86::BI__builtin_ia32_shuf_i32x4:
1772 case X86::BI__builtin_ia32_shuf_i64x2: {
1773 mlir::Value src1 = ops[0];
1774 mlir::Value src2 = ops[1];
1777 ops[2].getDefiningOp<cir::ConstantOp>().getIntValue().getZExtValue();
1781 unsigned numLanes = totalBits == 512 ? 4 : 2;
1782 unsigned numElemsPerLane = numElems / numLanes;
1785 mlir::Type i32Ty = builder.getSInt32Ty();
1787 for (
unsigned l = 0; l != numElems; l += numElemsPerLane) {
1788 unsigned index = (imm % numLanes) * numElemsPerLane;
1790 if (l >= (numElems / 2))
1792 for (
unsigned i = 0; i != numElemsPerLane; ++i) {
1793 indices.push_back(cir::IntAttr::get(i32Ty,
index + i));
1797 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), src1, src2,
1800 case X86::BI__builtin_ia32_vperm2f128_pd256:
1801 case X86::BI__builtin_ia32_vperm2f128_ps256:
1802 case X86::BI__builtin_ia32_vperm2f128_si256:
1803 case X86::BI__builtin_ia32_permti256:
1804 case X86::BI__builtin_ia32_pslldqi128_byteshift:
1805 case X86::BI__builtin_ia32_pslldqi256_byteshift:
1806 case X86::BI__builtin_ia32_pslldqi512_byteshift:
1807 case X86::BI__builtin_ia32_psrldqi128_byteshift:
1808 case X86::BI__builtin_ia32_psrldqi256_byteshift:
1809 case X86::BI__builtin_ia32_psrldqi512_byteshift:
1810 cgm.errorNYI(
expr->getSourceRange(),
1811 std::string(
"unimplemented X86 builtin call: ") +
1812 getContext().BuiltinInfo.getName(builtinID));
1813 return mlir::Value{};
1814 case X86::BI__builtin_ia32_kshiftliqi:
1815 case X86::BI__builtin_ia32_kshiftlihi:
1816 case X86::BI__builtin_ia32_kshiftlisi:
1817 case X86::BI__builtin_ia32_kshiftlidi: {
1818 mlir::Location loc =
getLoc(
expr->getExprLoc());
1820 ops[1].getDefiningOp<cir::ConstantOp>().getIntValue().getZExtValue() &
1824 if (shiftVal >= numElems)
1825 return builder.getNullValue(ops[0].
getType(), loc);
1830 mlir::Type i32Ty = builder.getSInt32Ty();
1831 for (
auto i : llvm::seq<unsigned>(0, numElems))
1832 indices.push_back(cir::IntAttr::get(i32Ty, numElems + i - shiftVal));
1834 mlir::Value zero = builder.getNullValue(
in.getType(), loc);
1835 mlir::Value sv = builder.createVecShuffle(loc, zero,
in, indices);
1836 return builder.createBitcast(sv, ops[0].
getType());
1838 case X86::BI__builtin_ia32_kshiftriqi:
1839 case X86::BI__builtin_ia32_kshiftrihi:
1840 case X86::BI__builtin_ia32_kshiftrisi:
1841 case X86::BI__builtin_ia32_kshiftridi: {
1842 mlir::Location loc =
getLoc(
expr->getExprLoc());
1844 ops[1].getDefiningOp<cir::ConstantOp>().getIntValue().getZExtValue() &
1848 if (shiftVal >= numElems)
1849 return builder.getNullValue(ops[0].
getType(), loc);
1854 mlir::Type i32Ty = builder.getSInt32Ty();
1855 for (
auto i : llvm::seq<unsigned>(0, numElems))
1856 indices.push_back(cir::IntAttr::get(i32Ty, i + shiftVal));
1858 mlir::Value zero = builder.getNullValue(
in.getType(), loc);
1859 mlir::Value sv = builder.createVecShuffle(loc,
in, zero, indices);
1860 return builder.createBitcast(sv, ops[0].
getType());
1862 case X86::BI__builtin_ia32_vprotbi:
1863 case X86::BI__builtin_ia32_vprotwi:
1864 case X86::BI__builtin_ia32_vprotdi:
1865 case X86::BI__builtin_ia32_vprotqi:
1866 case X86::BI__builtin_ia32_prold128:
1867 case X86::BI__builtin_ia32_prold256:
1868 case X86::BI__builtin_ia32_prold512:
1869 case X86::BI__builtin_ia32_prolq128:
1870 case X86::BI__builtin_ia32_prolq256:
1871 case X86::BI__builtin_ia32_prolq512:
1873 ops[0], ops[1],
false);
1874 case X86::BI__builtin_ia32_prord128:
1875 case X86::BI__builtin_ia32_prord256:
1876 case X86::BI__builtin_ia32_prord512:
1877 case X86::BI__builtin_ia32_prorq128:
1878 case X86::BI__builtin_ia32_prorq256:
1879 case X86::BI__builtin_ia32_prorq512:
1881 ops[0], ops[1],
true);
1882 case X86::BI__builtin_ia32_selectb_128:
1883 case X86::BI__builtin_ia32_selectb_256:
1884 case X86::BI__builtin_ia32_selectb_512:
1885 case X86::BI__builtin_ia32_selectw_128:
1886 case X86::BI__builtin_ia32_selectw_256:
1887 case X86::BI__builtin_ia32_selectw_512:
1888 case X86::BI__builtin_ia32_selectd_128:
1889 case X86::BI__builtin_ia32_selectd_256:
1890 case X86::BI__builtin_ia32_selectd_512:
1891 case X86::BI__builtin_ia32_selectq_128:
1892 case X86::BI__builtin_ia32_selectq_256:
1893 case X86::BI__builtin_ia32_selectq_512:
1894 case X86::BI__builtin_ia32_selectph_128:
1895 case X86::BI__builtin_ia32_selectph_256:
1896 case X86::BI__builtin_ia32_selectph_512:
1897 case X86::BI__builtin_ia32_selectpbf_128:
1898 case X86::BI__builtin_ia32_selectpbf_256:
1899 case X86::BI__builtin_ia32_selectpbf_512:
1900 case X86::BI__builtin_ia32_selectps_128:
1901 case X86::BI__builtin_ia32_selectps_256:
1902 case X86::BI__builtin_ia32_selectps_512:
1903 case X86::BI__builtin_ia32_selectpd_128:
1904 case X86::BI__builtin_ia32_selectpd_256:
1905 case X86::BI__builtin_ia32_selectpd_512:
1908 case X86::BI__builtin_ia32_selectsh_128:
1909 case X86::BI__builtin_ia32_selectsbf_128:
1910 case X86::BI__builtin_ia32_selectss_128:
1911 case X86::BI__builtin_ia32_selectsd_128: {
1912 mlir::Location loc =
getLoc(
expr->getExprLoc());
1913 mlir::Value scalar1 =
1914 builder.createExtractElement(loc, ops[1], uint64_t(0));
1915 mlir::Value scalar2 =
1916 builder.createExtractElement(loc, ops[2], uint64_t(0));
1917 mlir::Value result =
1919 return builder.createInsertElement(loc, ops[1], result, uint64_t(0));
1921 case X86::BI__builtin_ia32_cmpb128_mask:
1922 case X86::BI__builtin_ia32_cmpb256_mask:
1923 case X86::BI__builtin_ia32_cmpb512_mask:
1924 case X86::BI__builtin_ia32_cmpw128_mask:
1925 case X86::BI__builtin_ia32_cmpw256_mask:
1926 case X86::BI__builtin_ia32_cmpw512_mask:
1927 case X86::BI__builtin_ia32_cmpd128_mask:
1928 case X86::BI__builtin_ia32_cmpd256_mask:
1929 case X86::BI__builtin_ia32_cmpd512_mask:
1930 case X86::BI__builtin_ia32_cmpq128_mask:
1931 case X86::BI__builtin_ia32_cmpq256_mask:
1932 case X86::BI__builtin_ia32_cmpq512_mask:
1933 case X86::BI__builtin_ia32_ucmpb128_mask:
1934 case X86::BI__builtin_ia32_ucmpb256_mask:
1935 case X86::BI__builtin_ia32_ucmpb512_mask:
1936 case X86::BI__builtin_ia32_ucmpw128_mask:
1937 case X86::BI__builtin_ia32_ucmpw256_mask:
1938 case X86::BI__builtin_ia32_ucmpw512_mask:
1939 case X86::BI__builtin_ia32_ucmpd128_mask:
1940 case X86::BI__builtin_ia32_ucmpd256_mask:
1941 case X86::BI__builtin_ia32_ucmpd512_mask:
1942 case X86::BI__builtin_ia32_ucmpq128_mask:
1943 case X86::BI__builtin_ia32_ucmpq256_mask:
1944 case X86::BI__builtin_ia32_ucmpq512_mask: {
1949 case X86::BI__builtin_ia32_vpcomb:
1950 case X86::BI__builtin_ia32_vpcomw:
1951 case X86::BI__builtin_ia32_vpcomd:
1952 case X86::BI__builtin_ia32_vpcomq:
1954 case X86::BI__builtin_ia32_vpcomub:
1955 case X86::BI__builtin_ia32_vpcomuw:
1956 case X86::BI__builtin_ia32_vpcomud:
1957 case X86::BI__builtin_ia32_vpcomuq:
1959 case X86::BI__builtin_ia32_kortestcqi:
1960 case X86::BI__builtin_ia32_kortestchi:
1961 case X86::BI__builtin_ia32_kortestcsi:
1962 case X86::BI__builtin_ia32_kortestcdi: {
1963 mlir::Location loc =
getLoc(
expr->getExprLoc());
1965 mlir::Value allOnesOp =
1966 builder.getConstAPInt(loc, ty, APInt::getAllOnes(ty.getWidth()));
1969 cir::CmpOp::create(builder, loc, cir::CmpOpKind::eq, orOp, allOnesOp);
1970 return builder.createCast(cir::CastKind::bool_to_int, cmp,
1971 cgm.convertType(
expr->getType()));
1973 case X86::BI__builtin_ia32_kortestzqi:
1974 case X86::BI__builtin_ia32_kortestzhi:
1975 case X86::BI__builtin_ia32_kortestzsi:
1976 case X86::BI__builtin_ia32_kortestzdi: {
1977 mlir::Location loc =
getLoc(
expr->getExprLoc());
1979 mlir::Value allZerosOp = builder.getNullValue(ty, loc).getResult();
1982 cir::CmpOp::create(builder, loc, cir::CmpOpKind::eq, orOp, allZerosOp);
1983 return builder.createCast(cir::CastKind::bool_to_int, cmp,
1984 cgm.convertType(
expr->getType()));
1986 case X86::BI__builtin_ia32_ktestcqi:
1988 "x86.avx512.ktestc.b", ops);
1989 case X86::BI__builtin_ia32_ktestzqi:
1991 "x86.avx512.ktestz.b", ops);
1992 case X86::BI__builtin_ia32_ktestchi:
1994 "x86.avx512.ktestc.w", ops);
1995 case X86::BI__builtin_ia32_ktestzhi:
1997 "x86.avx512.ktestz.w", ops);
1998 case X86::BI__builtin_ia32_ktestcsi:
2000 "x86.avx512.ktestc.d", ops);
2001 case X86::BI__builtin_ia32_ktestzsi:
2003 "x86.avx512.ktestz.d", ops);
2004 case X86::BI__builtin_ia32_ktestcdi:
2006 "x86.avx512.ktestc.q", ops);
2007 case X86::BI__builtin_ia32_ktestzdi:
2009 "x86.avx512.ktestz.q", ops);
2010 case X86::BI__builtin_ia32_kaddqi:
2012 "x86.avx512.kadd.b", ops);
2013 case X86::BI__builtin_ia32_kaddhi:
2015 "x86.avx512.kadd.w", ops);
2016 case X86::BI__builtin_ia32_kaddsi:
2018 "x86.avx512.kadd.d", ops);
2019 case X86::BI__builtin_ia32_kadddi:
2021 "x86.avx512.kadd.q", ops);
2022 case X86::BI__builtin_ia32_kandqi:
2023 case X86::BI__builtin_ia32_kandhi:
2024 case X86::BI__builtin_ia32_kandsi:
2025 case X86::BI__builtin_ia32_kanddi:
2028 case X86::BI__builtin_ia32_kandnqi:
2029 case X86::BI__builtin_ia32_kandnhi:
2030 case X86::BI__builtin_ia32_kandnsi:
2031 case X86::BI__builtin_ia32_kandndi:
2034 case X86::BI__builtin_ia32_korqi:
2035 case X86::BI__builtin_ia32_korhi:
2036 case X86::BI__builtin_ia32_korsi:
2037 case X86::BI__builtin_ia32_kordi:
2040 case X86::BI__builtin_ia32_kxnorqi:
2041 case X86::BI__builtin_ia32_kxnorhi:
2042 case X86::BI__builtin_ia32_kxnorsi:
2043 case X86::BI__builtin_ia32_kxnordi:
2046 case X86::BI__builtin_ia32_kxorqi:
2047 case X86::BI__builtin_ia32_kxorhi:
2048 case X86::BI__builtin_ia32_kxorsi:
2049 case X86::BI__builtin_ia32_kxordi:
2052 case X86::BI__builtin_ia32_knotqi:
2053 case X86::BI__builtin_ia32_knothi:
2054 case X86::BI__builtin_ia32_knotsi:
2055 case X86::BI__builtin_ia32_knotdi: {
2057 unsigned numElts = intTy.getWidth();
2058 mlir::Value resVec =
2060 return builder.createBitcast(builder.createNot(resVec), ops[0].getType());
2062 case X86::BI__builtin_ia32_kmovb:
2063 case X86::BI__builtin_ia32_kmovw:
2064 case X86::BI__builtin_ia32_kmovd:
2065 case X86::BI__builtin_ia32_kmovq: {
2070 unsigned numElts = intTy.getWidth();
2071 mlir::Value resVec =
2073 return builder.createBitcast(resVec, ops[0].
getType());
2075 case X86::BI__builtin_ia32_sqrtsh_round_mask:
2076 case X86::BI__builtin_ia32_sqrtsd_round_mask:
2077 case X86::BI__builtin_ia32_sqrtss_round_mask:
2078 cgm.errorNYI(
expr->getSourceRange(),
2079 std::string(
"unimplemented X86 builtin call: ") +
2080 getContext().BuiltinInfo.getName(builtinID));
2081 return mlir::Value{};
2082 case X86::BI__builtin_ia32_sqrtph512:
2083 case X86::BI__builtin_ia32_sqrtps512:
2084 case X86::BI__builtin_ia32_sqrtpd512: {
2085 mlir::Location loc =
getLoc(
expr->getExprLoc());
2086 mlir::Value arg = ops[0];
2087 return cir::SqrtOp::create(builder, loc, arg.getType(), arg).getResult();
2089 case X86::BI__builtin_ia32_pmuludq128:
2090 case X86::BI__builtin_ia32_pmuludq256:
2091 case X86::BI__builtin_ia32_pmuludq512: {
2092 unsigned opTypePrimitiveSizeInBits =
2093 cgm.getDataLayout().getTypeSizeInBits(ops[0].
getType());
2095 ops, opTypePrimitiveSizeInBits);
2097 case X86::BI__builtin_ia32_pmuldq128:
2098 case X86::BI__builtin_ia32_pmuldq256:
2099 case X86::BI__builtin_ia32_pmuldq512: {
2100 unsigned opTypePrimitiveSizeInBits =
2101 cgm.getDataLayout().getTypeSizeInBits(ops[0].
getType());
2103 ops, opTypePrimitiveSizeInBits);
2105 case X86::BI__builtin_ia32_pternlogd512_mask:
2106 case X86::BI__builtin_ia32_pternlogq512_mask:
2107 case X86::BI__builtin_ia32_pternlogd128_mask:
2108 case X86::BI__builtin_ia32_pternlogd256_mask:
2109 case X86::BI__builtin_ia32_pternlogq128_mask:
2110 case X86::BI__builtin_ia32_pternlogq256_mask:
2111 case X86::BI__builtin_ia32_pternlogd512_maskz:
2112 case X86::BI__builtin_ia32_pternlogq512_maskz:
2113 case X86::BI__builtin_ia32_pternlogd128_maskz:
2114 case X86::BI__builtin_ia32_pternlogd256_maskz:
2115 case X86::BI__builtin_ia32_pternlogq128_maskz:
2116 case X86::BI__builtin_ia32_pternlogq256_maskz:
2117 cgm.errorNYI(
expr->getSourceRange(),
2118 std::string(
"unimplemented X86 builtin call: ") +
2119 getContext().BuiltinInfo.getName(builtinID));
2120 return mlir::Value{};
2121 case X86::BI__builtin_ia32_vpshldd128:
2122 case X86::BI__builtin_ia32_vpshldd256:
2123 case X86::BI__builtin_ia32_vpshldd512:
2124 case X86::BI__builtin_ia32_vpshldq128:
2125 case X86::BI__builtin_ia32_vpshldq256:
2126 case X86::BI__builtin_ia32_vpshldq512:
2127 case X86::BI__builtin_ia32_vpshldw128:
2128 case X86::BI__builtin_ia32_vpshldw256:
2129 case X86::BI__builtin_ia32_vpshldw512:
2131 ops[1], ops[2],
false);
2132 case X86::BI__builtin_ia32_vpshrdd128:
2133 case X86::BI__builtin_ia32_vpshrdd256:
2134 case X86::BI__builtin_ia32_vpshrdd512:
2135 case X86::BI__builtin_ia32_vpshrdq128:
2136 case X86::BI__builtin_ia32_vpshrdq256:
2137 case X86::BI__builtin_ia32_vpshrdq512:
2138 case X86::BI__builtin_ia32_vpshrdw128:
2139 case X86::BI__builtin_ia32_vpshrdw256:
2140 case X86::BI__builtin_ia32_vpshrdw512:
2143 ops[0], ops[2],
true);
2144 case X86::BI__builtin_ia32_reduce_fadd_pd512:
2145 case X86::BI__builtin_ia32_reduce_fadd_ps512:
2146 case X86::BI__builtin_ia32_reduce_fadd_ph512:
2147 case X86::BI__builtin_ia32_reduce_fadd_ph256:
2148 case X86::BI__builtin_ia32_reduce_fadd_ph128: {
2150 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
2151 "vector.reduce.fadd", ops[0].getType(),
2152 mlir::ValueRange{ops[0], ops[1]});
2154 case X86::BI__builtin_ia32_reduce_fmul_pd512:
2155 case X86::BI__builtin_ia32_reduce_fmul_ps512:
2156 case X86::BI__builtin_ia32_reduce_fmul_ph512:
2157 case X86::BI__builtin_ia32_reduce_fmul_ph256:
2158 case X86::BI__builtin_ia32_reduce_fmul_ph128: {
2160 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
2161 "vector.reduce.fmul", ops[0].getType(),
2162 mlir::ValueRange{ops[0], ops[1]});
2164 case X86::BI__builtin_ia32_reduce_fmax_pd512:
2165 case X86::BI__builtin_ia32_reduce_fmax_ps512:
2166 case X86::BI__builtin_ia32_reduce_fmax_ph512:
2167 case X86::BI__builtin_ia32_reduce_fmax_ph256:
2168 case X86::BI__builtin_ia32_reduce_fmax_ph128: {
2171 return builder.emitIntrinsicCallOp(
2172 getLoc(
expr->getExprLoc()),
"vector.reduce.fmax",
2173 vecTy.getElementType(), mlir::ValueRange{ops[0]});
2175 case X86::BI__builtin_ia32_reduce_fmin_pd512:
2176 case X86::BI__builtin_ia32_reduce_fmin_ps512:
2177 case X86::BI__builtin_ia32_reduce_fmin_ph512:
2178 case X86::BI__builtin_ia32_reduce_fmin_ph256:
2179 case X86::BI__builtin_ia32_reduce_fmin_ph128: {
2182 return builder.emitIntrinsicCallOp(
2183 getLoc(
expr->getExprLoc()),
"vector.reduce.fmin",
2184 vecTy.getElementType(), mlir::ValueRange{ops[0]});
2186 case X86::BI__builtin_ia32_rdrand16_step:
2187 case X86::BI__builtin_ia32_rdrand32_step:
2188 case X86::BI__builtin_ia32_rdrand64_step:
2189 case X86::BI__builtin_ia32_rdseed16_step:
2190 case X86::BI__builtin_ia32_rdseed32_step:
2191 case X86::BI__builtin_ia32_rdseed64_step: {
2192 llvm::StringRef intrinsicName;
2193 switch (builtinID) {
2195 llvm_unreachable(
"Unsupported intrinsic!");
2196 case X86::BI__builtin_ia32_rdrand16_step:
2197 intrinsicName =
"x86.rdrand.16";
2199 case X86::BI__builtin_ia32_rdrand32_step:
2200 intrinsicName =
"x86.rdrand.32";
2202 case X86::BI__builtin_ia32_rdrand64_step:
2203 intrinsicName =
"x86.rdrand.64";
2205 case X86::BI__builtin_ia32_rdseed16_step:
2206 intrinsicName =
"x86.rdseed.16";
2208 case X86::BI__builtin_ia32_rdseed32_step:
2209 intrinsicName =
"x86.rdseed.32";
2211 case X86::BI__builtin_ia32_rdseed64_step:
2212 intrinsicName =
"x86.rdseed.64";
2216 mlir::Location loc =
getLoc(
expr->getExprLoc());
2219 builder.getUInt32Ty()};
2220 cir::RecordType resRecord =
2221 cir::RecordType::get(&
getMLIRContext(), resultTypes,
false,
false,
2222 cir::RecordType::RecordKind::Struct);
2225 builder.emitIntrinsicCallOp(loc, intrinsicName, resRecord);
2227 cir::ExtractMemberOp::create(builder, loc, randTy, call, 0);
2228 builder.CIRBaseBuilderTy::createStore(loc, rand, ops[0]);
2230 return cir::ExtractMemberOp::create(builder, loc, builder.getUInt32Ty(),
2233 case X86::BI__builtin_ia32_addcarryx_u32:
2234 case X86::BI__builtin_ia32_addcarryx_u64:
2235 case X86::BI__builtin_ia32_subborrow_u32:
2236 case X86::BI__builtin_ia32_subborrow_u64:
2237 cgm.errorNYI(
expr->getSourceRange(),
2238 std::string(
"unimplemented X86 builtin call: ") +
2239 getContext().BuiltinInfo.getName(builtinID));
2240 return mlir::Value{};
2241 case X86::BI__builtin_ia32_fpclassps128_mask:
2242 case X86::BI__builtin_ia32_fpclassps256_mask:
2243 case X86::BI__builtin_ia32_fpclassps512_mask:
2244 case X86::BI__builtin_ia32_vfpclassbf16128_mask:
2245 case X86::BI__builtin_ia32_vfpclassbf16256_mask:
2246 case X86::BI__builtin_ia32_vfpclassbf16512_mask:
2247 case X86::BI__builtin_ia32_fpclassph128_mask:
2248 case X86::BI__builtin_ia32_fpclassph256_mask:
2249 case X86::BI__builtin_ia32_fpclassph512_mask:
2250 case X86::BI__builtin_ia32_fpclasspd128_mask:
2251 case X86::BI__builtin_ia32_fpclasspd256_mask:
2252 case X86::BI__builtin_ia32_fpclasspd512_mask:
2254 case X86::BI__builtin_ia32_vp2intersect_q_512:
2255 case X86::BI__builtin_ia32_vp2intersect_q_256:
2256 case X86::BI__builtin_ia32_vp2intersect_q_128:
2257 case X86::BI__builtin_ia32_vp2intersect_d_512:
2258 case X86::BI__builtin_ia32_vp2intersect_d_256:
2259 case X86::BI__builtin_ia32_vp2intersect_d_128: {
2261 mlir::Location loc =
getLoc(
expr->getExprLoc());
2262 StringRef intrinsicName;
2264 switch (builtinID) {
2266 llvm_unreachable(
"Unexpected builtin");
2267 case X86::BI__builtin_ia32_vp2intersect_q_512:
2268 intrinsicName =
"x86.avx512.vp2intersect.q.512";
2270 case X86::BI__builtin_ia32_vp2intersect_q_256:
2271 intrinsicName =
"x86.avx512.vp2intersect.q.256";
2273 case X86::BI__builtin_ia32_vp2intersect_q_128:
2274 intrinsicName =
"x86.avx512.vp2intersect.q.128";
2276 case X86::BI__builtin_ia32_vp2intersect_d_512:
2277 intrinsicName =
"x86.avx512.vp2intersect.d.512";
2279 case X86::BI__builtin_ia32_vp2intersect_d_256:
2280 intrinsicName =
"x86.avx512.vp2intersect.d.256";
2282 case X86::BI__builtin_ia32_vp2intersect_d_128:
2283 intrinsicName =
"x86.avx512.vp2intersect.d.128";
2287 auto resVector = cir::VectorType::get(builder.getBoolTy(), numElts);
2289 cir::RecordType resRecord =
2290 cir::RecordType::get(&
getMLIRContext(), {resVector, resVector},
false,
2291 false, cir::RecordType::RecordKind::Struct);
2293 mlir::Value call = builder.emitIntrinsicCallOp(
2294 getLoc(
expr->getExprLoc()), intrinsicName, resRecord,
2295 mlir::ValueRange{ops[0], ops[1]});
2296 mlir::Value result =
2297 cir::ExtractMemberOp::create(builder, loc, resVector, call, 0);
2301 builder.createStore(loc, result, addr);
2303 result = cir::ExtractMemberOp::create(builder, loc, resVector, call, 1);
2307 builder.createStore(loc, result, addr);
2308 return mlir::Value{};
2310 case X86::BI__builtin_ia32_vpmultishiftqb128:
2311 case X86::BI__builtin_ia32_vpmultishiftqb256:
2312 case X86::BI__builtin_ia32_vpmultishiftqb512:
2313 case X86::BI__builtin_ia32_vpshufbitqmb128_mask:
2314 case X86::BI__builtin_ia32_vpshufbitqmb256_mask:
2315 case X86::BI__builtin_ia32_vpshufbitqmb512_mask:
2316 case X86::BI__builtin_ia32_cmpeqps:
2317 case X86::BI__builtin_ia32_cmpeqpd:
2320 case X86::BI__builtin_ia32_cmpltps:
2321 case X86::BI__builtin_ia32_cmpltpd:
2324 case X86::BI__builtin_ia32_cmpleps:
2325 case X86::BI__builtin_ia32_cmplepd:
2328 case X86::BI__builtin_ia32_cmpunordps:
2329 case X86::BI__builtin_ia32_cmpunordpd:
2332 case X86::BI__builtin_ia32_cmpneqps:
2333 case X86::BI__builtin_ia32_cmpneqpd:
2336 case X86::BI__builtin_ia32_cmpnltps:
2337 case X86::BI__builtin_ia32_cmpnltpd:
2340 case X86::BI__builtin_ia32_cmpnleps:
2341 case X86::BI__builtin_ia32_cmpnlepd:
2344 case X86::BI__builtin_ia32_cmpordps:
2345 case X86::BI__builtin_ia32_cmpordpd:
2348 case X86::BI__builtin_ia32_cmpph128_mask:
2349 case X86::BI__builtin_ia32_cmpph256_mask:
2350 case X86::BI__builtin_ia32_cmpph512_mask:
2351 case X86::BI__builtin_ia32_cmpps128_mask:
2352 case X86::BI__builtin_ia32_cmpps256_mask:
2353 case X86::BI__builtin_ia32_cmpps512_mask:
2354 case X86::BI__builtin_ia32_cmppd128_mask:
2355 case X86::BI__builtin_ia32_cmppd256_mask:
2356 case X86::BI__builtin_ia32_cmppd512_mask:
2357 case X86::BI__builtin_ia32_vcmpbf16512_mask:
2358 case X86::BI__builtin_ia32_vcmpbf16256_mask:
2359 case X86::BI__builtin_ia32_vcmpbf16128_mask:
2360 case X86::BI__builtin_ia32_cmpps:
2361 case X86::BI__builtin_ia32_cmpps256:
2362 case X86::BI__builtin_ia32_cmppd:
2363 case X86::BI__builtin_ia32_cmppd256:
2364 case X86::BI__builtin_ia32_cmpeqss:
2365 case X86::BI__builtin_ia32_cmpltss:
2366 case X86::BI__builtin_ia32_cmpless:
2367 case X86::BI__builtin_ia32_cmpunordss:
2368 case X86::BI__builtin_ia32_cmpneqss:
2369 case X86::BI__builtin_ia32_cmpnltss:
2370 case X86::BI__builtin_ia32_cmpnless:
2371 case X86::BI__builtin_ia32_cmpordss:
2372 case X86::BI__builtin_ia32_cmpeqsd:
2373 case X86::BI__builtin_ia32_cmpltsd:
2374 case X86::BI__builtin_ia32_cmplesd:
2375 case X86::BI__builtin_ia32_cmpunordsd:
2376 case X86::BI__builtin_ia32_cmpneqsd:
2377 case X86::BI__builtin_ia32_cmpnltsd:
2378 case X86::BI__builtin_ia32_cmpnlesd:
2379 case X86::BI__builtin_ia32_cmpordsd:
2380 cgm.errorNYI(
expr->getSourceRange(),
2381 std::string(
"unimplemented X86 builtin call: ") +
2382 getContext().BuiltinInfo.getName(builtinID));
2384 case X86::BI__builtin_ia32_vcvtph2ps_mask:
2385 case X86::BI__builtin_ia32_vcvtph2ps256_mask:
2386 case X86::BI__builtin_ia32_vcvtph2ps512_mask: {
2387 mlir::Location loc =
getLoc(
expr->getExprLoc());
2391 case X86::BI__builtin_ia32_cvtneps2bf16_128_mask: {
2392 mlir::Location loc =
getLoc(
expr->getExprLoc());
2396 unsigned numElts = inputTy.getSize();
2401 args.push_back(ops[0]);
2402 args.push_back(ops[1]);
2403 args.push_back(mask);
2405 return builder.emitIntrinsicCallOp(
2406 loc,
"x86.avx512bf16.mask.cvtneps2bf16.128", resTy, args);
2408 case X86::BI__builtin_ia32_cvtneps2bf16_256_mask:
2409 case X86::BI__builtin_ia32_cvtneps2bf16_512_mask: {
2410 mlir::Location loc =
getLoc(
expr->getExprLoc());
2412 StringRef intrinsicName;
2413 if (builtinID == X86::BI__builtin_ia32_cvtneps2bf16_256_mask) {
2414 intrinsicName =
"x86.avx512bf16.cvtneps2bf16.256";
2416 assert(builtinID == X86::BI__builtin_ia32_cvtneps2bf16_512_mask);
2417 intrinsicName =
"x86.avx512bf16.cvtneps2bf16.512";
2420 mlir::Value res = builder.emitIntrinsicCallOp(loc, intrinsicName, resTy,
2421 mlir::ValueRange{ops[0]});
2425 case X86::BI__cpuid:
2426 case X86::BI__cpuidex: {
2427 mlir::Location loc =
getLoc(
expr->getExprLoc());
2428 mlir::Value subFuncId = builtinID == X86::BI__cpuidex
2430 : builder.getConstInt(loc,
sInt32Ty, 0);
2431 cir::CpuIdOp::create(builder, loc, ops[0],
2433 return mlir::Value{};
2436 case X86::BI__emulu:
2438 case X86::BI__umulh:
2439 case X86::BI_mul128:
2440 case X86::BI_umul128: {
2441 cgm.errorNYI(
expr->getSourceRange(),
2442 std::string(
"unimplemented X86 builtin call: ") +
2443 getContext().BuiltinInfo.getName(builtinID));
2444 return mlir::Value{};
2446 case X86::BI__faststorefence: {
2447 cir::AtomicFenceOp::create(
2449 cir::MemOrder::SequentiallyConsistent,
2451 cir::SyncScopeKind::System));
2452 return mlir::Value{};
2454 case X86::BI__shiftleft128:
2455 case X86::BI__shiftright128: {
2459 std::swap(ops[0], ops[1]);
2462 auto amtTy = mlir::cast<cir::IntType>(ops[2].
getType());
2463 cir::IntType i64Ty = builder.getUInt64Ty();
2466 ops[2] = builder.createIntCast(ops[2], i64Ty);
2468 const StringRef intrinsicName =
2469 (builtinID == X86::BI__shiftleft128) ?
"fshl" :
"fshr";
2470 return builder.emitIntrinsicCallOp(
2471 getLoc(
expr->getExprLoc()), intrinsicName, i64Ty,
2472 mlir::ValueRange{ops[0], ops[1], ops[2]});
2474 case X86::BI_ReadWriteBarrier:
2475 case X86::BI_ReadBarrier:
2476 case X86::BI_WriteBarrier: {
2477 cir::AtomicFenceOp::create(
2479 cir::MemOrder::SequentiallyConsistent,
2481 cir::SyncScopeKind::SingleThread));
2482 return mlir::Value{};
2484 case X86::BI_AddressOfReturnAddress: {
2485 mlir::Location loc =
getLoc(
expr->getExprLoc());
2488 return builder.createCast(loc, cir::CastKind::bitcast, addr,
voidPtrTy);
2490 case X86::BI__stosb:
2492 case X86::BI__int2c:
2493 case X86::BI__readfsbyte:
2494 case X86::BI__readfsword:
2495 case X86::BI__readfsdword:
2496 case X86::BI__readfsqword:
2497 case X86::BI__readgsbyte:
2498 case X86::BI__readgsword:
2499 case X86::BI__readgsdword:
2500 case X86::BI__readgsqword: {
2501 cgm.errorNYI(
expr->getSourceRange(),
2502 std::string(
"unimplemented X86 builtin call: ") +
2503 getContext().BuiltinInfo.getName(builtinID));
2504 return mlir::Value{};
2506 case X86::BI__builtin_ia32_encodekey128_u32: {
2508 {ops[0], ops[1]}, ops[2], 6,
"x86.encodekey128", 3);
2510 case X86::BI__builtin_ia32_encodekey256_u32: {
2513 {ops[0], ops[1], ops[2]}, ops[3], 7,
2514 "x86.encodekey256", 4);
2517 case X86::BI__builtin_ia32_aesenc128kl_u8:
2518 case X86::BI__builtin_ia32_aesdec128kl_u8:
2519 case X86::BI__builtin_ia32_aesenc256kl_u8:
2520 case X86::BI__builtin_ia32_aesdec256kl_u8: {
2521 llvm::StringRef intrinsicName;
2522 switch (builtinID) {
2524 llvm_unreachable(
"Unexpected builtin");
2525 case X86::BI__builtin_ia32_aesenc128kl_u8:
2526 intrinsicName =
"x86.aesenc128kl";
2528 case X86::BI__builtin_ia32_aesdec128kl_u8:
2529 intrinsicName =
"x86.aesdec128kl";
2531 case X86::BI__builtin_ia32_aesenc256kl_u8:
2532 intrinsicName =
"x86.aesenc256kl";
2534 case X86::BI__builtin_ia32_aesdec256kl_u8:
2535 intrinsicName =
"x86.aesdec256kl";
2542 case X86::BI__builtin_ia32_aesencwide128kl_u8:
2543 case X86::BI__builtin_ia32_aesdecwide128kl_u8:
2544 case X86::BI__builtin_ia32_aesencwide256kl_u8:
2545 case X86::BI__builtin_ia32_aesdecwide256kl_u8: {
2546 llvm::StringRef intrinsicName;
2547 switch (builtinID) {
2549 llvm_unreachable(
"Unexpected builtin");
2550 case X86::BI__builtin_ia32_aesencwide128kl_u8:
2551 intrinsicName =
"x86.aesencwide128kl";
2553 case X86::BI__builtin_ia32_aesdecwide128kl_u8:
2554 intrinsicName =
"x86.aesdecwide128kl";
2556 case X86::BI__builtin_ia32_aesencwide256kl_u8:
2557 intrinsicName =
"x86.aesencwide256kl";
2559 case X86::BI__builtin_ia32_aesdecwide256kl_u8:
2560 intrinsicName =
"x86.aesdecwide256kl";
2567 case X86::BI__builtin_ia32_vfcmaddcph512_mask:
2568 case X86::BI__builtin_ia32_vfmaddcph512_mask:
2569 case X86::BI__builtin_ia32_vfcmaddcsh_round_mask:
2570 case X86::BI__builtin_ia32_vfmaddcsh_round_mask:
2571 case X86::BI__builtin_ia32_vfcmaddcsh_round_mask3:
2572 case X86::BI__builtin_ia32_vfmaddcsh_round_mask3:
2573 case X86::BI__builtin_ia32_prefetchi:
2574 cgm.errorNYI(
expr->getSourceRange(),
2575 std::string(
"unimplemented X86 builtin call: ") +
2576 getContext().BuiltinInfo.getName(builtinID));
2577 return mlir::Value{};