clang 23.0.0git
CIRGenBuiltinAMDGPU.cpp
Go to the documentation of this file.
1//===---- CIRGenBuiltinAMDGPU.cpp - Emit CIR for AMDGPU builtins ----------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This contains code to emit AMDGPU Builtin calls.
10//
11//===----------------------------------------------------------------------===//
12
13#include "CIRGenFunction.h"
14
15#include "mlir/IR/Value.h"
17#include "llvm/Support/AMDGPUAddrSpace.h"
18#include "llvm/Support/ErrorHandling.h"
19
20using namespace clang;
21using namespace clang::CIRGen;
22using namespace cir;
23
24// Emit the `amdgcn.dispatch.ptr` intrinsic, address-space-casting the
25// result to match \p e's return type when needed.
26// If \p e is null, returns the raw AS-4 pointer.
27static mlir::Value emitAMDGPUDispatchPtr(CIRGenFunction &cgf,
28 const CallExpr *e = nullptr) {
29 CIRGenBuilderTy &builder = cgf.getBuilder();
30 mlir::Location loc =
31 e ? cgf.getLoc(e->getExprLoc()) : builder.getUnknownLoc();
32 // The intrinsic always returns a pointer in the constant AS.
33 mlir::Type retTy = cir::PointerType::get(
34 cir::VoidType::get(builder.getContext()),
35 cir::TargetAddressSpaceAttr::get(builder.getContext(),
36 llvm::AMDGPUAS::CONSTANT_ADDRESS));
37 mlir::Value call = builder.emitIntrinsicCallOp(loc, "amdgcn.dispatch.ptr",
38 retTy, mlir::ValueRange{});
39 if (!e)
40 return call;
41 // Only cast when the caller-visible AS differs from the intrinsic's AS;
42 auto expectedPtrTy =
43 mlir::cast<cir::PointerType>(cgf.convertType(e->getType()));
44 auto callPtrTy = mlir::cast<cir::PointerType>(call.getType());
45 if (expectedPtrTy.getAddrSpace() == callPtrTy.getAddrSpace())
46 return call;
47 return builder.createAddrSpaceCast(loc, call, expectedPtrTy);
48}
49
51 CIRGenFunction &cgf, const CallExpr *e, llvm::StringRef intrinsicName,
52 llvm::StringRef constrainedIntrinsicName) {
53 mlir::Value src0 = cgf.emitScalarExpr(e->getArg(0));
54 mlir::Value src1 = cgf.emitScalarExpr(e->getArg(1));
55 mlir::Location loc = cgf.getLoc(e->getExprLoc());
56
57 CIRGenBuilderTy &builder = cgf.getBuilder();
58
59 CIRGenFunction::CIRGenFPOptionsRAII fpOptsRAII(cgf, e);
60
61 if (builder.getIsFPConstrained()) {
63 "constrained FP intrinsic support is NYI.");
64 }
65
66 return builder.emitIntrinsicCallOp(loc, intrinsicName, src0.getType(),
67 mlir::ValueRange{src0, src1});
68}
69
70static mlir::Value emitLogbBuiltin(CIRGenFunction &cgf, const CallExpr *e,
71 const llvm::fltSemantics &fSem) {
72 CIRGenBuilderTy &builder = cgf.getBuilder();
73 mlir::Location loc = cgf.getLoc(e->getExprLoc());
74
75 mlir::Value src0 = cgf.emitScalarExpr(e->getArg(0));
76 mlir::Type srcTy = src0.getType();
77 mlir::Type int32Ty = builder.getSInt32Ty();
78
79 cir::RecordType frExpResTy =
80 builder.getAnonRecordTy({srcTy, int32Ty}, false, false);
81
82 mlir::Value frExpResult = builder.emitIntrinsicCallOp(
83 loc, "frexp", frExpResTy, mlir::ValueRange{src0});
84
85 mlir::Value exp =
86 cir::ExtractMemberOp::create(builder, loc, int32Ty, frExpResult, 1);
87
88 mlir::Value negativeOne =
89 builder.getConstant(loc, cir::IntAttr::get(int32Ty, -1));
90 mlir::Value expMinus1 = builder.createAdd(loc, exp, negativeOne);
91
92 mlir::Value siToFp = cir::CastOp::create(
93 builder, loc, srcTy, cir::CastKind::int_to_float, expMinus1);
94
95 mlir::Value fabs = cir::FAbsOp::create(builder, loc, srcTy, src0);
96
97 llvm::APFloat infVal = llvm::APFloat::getInf(fSem);
98 mlir::Value inf = builder.getConstant(loc, cir::FPAttr::get(srcTy, infVal));
99
100 mlir::Value fabsNegInf =
101 builder.createCompare(loc, cir::CmpOpKind::ne, fabs, inf);
102
103 mlir::Value sel = builder.createSelect(loc, fabsNegInf, siToFp, fabs);
104
105 llvm::APFloat zeroValue = llvm::APFloat::getZero(fSem);
106 mlir::Value zero =
107 builder.getConstant(loc, cir::FPAttr::get(srcTy, zeroValue));
108
109 mlir::Value srcEqZero =
110 builder.createCompare(loc, cir::CmpOpKind::eq, src0, zero);
111
112 llvm::APFloat negInfVal = llvm::APFloat::getInf(fSem, true);
113 mlir::Value negInf =
114 builder.getConstant(loc, cir::FPAttr::get(srcTy, negInfVal));
115
116 mlir::Value res = builder.createSelect(loc, srcEqZero, negInf, sel);
117
118 return res;
119}
120
121static mlir::Value
123 llvm::StringRef intrinsicName,
124 bool isImageStore) {
125 auto &builder = cgf.getBuilder();
126
128 for (unsigned i = 0, n = e->getNumArgs(); i < n; ++i)
129 args.push_back(cgf.emitScalarExpr(e->getArg(i)));
130
131 mlir::Type retTy = isImageStore ? cir::VoidType::get(builder.getContext())
132 : cgf.convertType(e->getType());
133
134 auto callOp = cir::LLVMIntrinsicCallOp::create(
135 builder, cgf.getLoc(e->getExprLoc()),
136 builder.getStringAttr(intrinsicName), retTy, args);
137
138 return callOp.getResult();
139}
140
141std::optional<mlir::Value>
143 const CallExpr *expr) {
144 switch (builtinId) {
145 case AMDGPU::BI__builtin_amdgcn_wave_reduce_add_u32:
146 case AMDGPU::BI__builtin_amdgcn_wave_reduce_sub_u32:
147 case AMDGPU::BI__builtin_amdgcn_wave_reduce_min_i32:
148 case AMDGPU::BI__builtin_amdgcn_wave_reduce_min_u32:
149 case AMDGPU::BI__builtin_amdgcn_wave_reduce_max_i32:
150 case AMDGPU::BI__builtin_amdgcn_wave_reduce_max_u32:
151 case AMDGPU::BI__builtin_amdgcn_wave_reduce_and_b32:
152 case AMDGPU::BI__builtin_amdgcn_wave_reduce_or_b32:
153 case AMDGPU::BI__builtin_amdgcn_wave_reduce_xor_b32:
154 case AMDGPU::BI__builtin_amdgcn_wave_reduce_add_u64:
155 case AMDGPU::BI__builtin_amdgcn_wave_reduce_sub_u64:
156 case AMDGPU::BI__builtin_amdgcn_wave_reduce_min_i64:
157 case AMDGPU::BI__builtin_amdgcn_wave_reduce_min_u64:
158 case AMDGPU::BI__builtin_amdgcn_wave_reduce_max_i64:
159 case AMDGPU::BI__builtin_amdgcn_wave_reduce_max_u64:
160 case AMDGPU::BI__builtin_amdgcn_wave_reduce_and_b64:
161 case AMDGPU::BI__builtin_amdgcn_wave_reduce_or_b64:
162 case AMDGPU::BI__builtin_amdgcn_wave_reduce_xor_b64: {
163 cgm.errorNYI(expr->getSourceRange(),
164 std::string("unimplemented AMDGPU builtin call: ") +
165 getContext().BuiltinInfo.getName(builtinId));
166 return mlir::Value{};
167 }
168 case AMDGPU::BI__builtin_amdgcn_div_scale:
169 case AMDGPU::BI__builtin_amdgcn_div_scalef: {
170 Address flagOutPtr = emitPointerWithAlignment(expr->getArg(3));
171 llvm::StringRef intrinsicName = "amdgcn.div.scale";
172 mlir::Value x = emitScalarExpr(expr->getArg(0));
173 mlir::Value y = emitScalarExpr(expr->getArg(1));
174 mlir::Value z = emitScalarExpr(expr->getArg(2));
175
176 auto i1Ty = builder.getUIntNTy(1);
177 cir::RecordType resTy = builder.getAnonRecordTy(
178 {x.getType(), i1Ty}, /*packed=*/false, /*padded=*/false);
179
180 mlir::Value structResult =
181 cir::LLVMIntrinsicCallOp::create(builder, getLoc(expr->getExprLoc()),
182 builder.getStringAttr(intrinsicName),
183 resTy, {x, y, z})
184 .getResult();
185
186 mlir::Value result = cir::ExtractMemberOp::create(
187 builder, getLoc(expr->getExprLoc()), x.getType(), structResult, 0);
188 mlir::Value flag = cir::ExtractMemberOp::create(
189 builder, getLoc(expr->getExprLoc()), i1Ty, structResult, 1);
190
191 mlir::Type flagType = flagOutPtr.getElementType();
192 mlir::Value flagToStore =
193 cir::CastOp::create(builder, getLoc(expr->getExprLoc()), flagType,
194 cir::CastKind::int_to_bool, flag);
195 builder.createStore(getLoc(expr->getExprLoc()), flagToStore, flagOutPtr);
196 return result;
197 }
198 case AMDGPU::BI__builtin_amdgcn_div_fmas:
199 case AMDGPU::BI__builtin_amdgcn_div_fmasf:
200 return emitBuiltinWithOneOverloadedType<4>(expr, "amdgcn.div.fmas")
201 .getValue();
202 case AMDGPU::BI__builtin_amdgcn_ds_swizzle:
203 return emitBuiltinWithOneOverloadedType<2>(expr, "amdgcn.ds.swizzle")
204 .getValue();
205 case AMDGPU::BI__builtin_amdgcn_mov_dpp8:
206 case AMDGPU::BI__builtin_amdgcn_mov_dpp:
207 case AMDGPU::BI__builtin_amdgcn_update_dpp: {
208 cgm.errorNYI(expr->getSourceRange(),
209 std::string("unimplemented AMDGPU builtin call: ") +
210 getContext().BuiltinInfo.getName(builtinId));
211 return mlir::Value{};
212 }
213 case AMDGPU::BI__builtin_amdgcn_permlane16:
214 case AMDGPU::BI__builtin_amdgcn_permlanex16:
215 case AMDGPU::BI__builtin_amdgcn_permlane64: {
216 cgm.errorNYI(expr->getSourceRange(),
217 std::string("unimplemented AMDGPU builtin call: ") +
218 getContext().BuiltinInfo.getName(builtinId));
219 return mlir::Value{};
220 }
221 case AMDGPU::BI__builtin_amdgcn_readlane:
222 return emitBuiltinWithOneOverloadedType<2>(expr, "amdgcn.readlane")
223 .getValue();
224 case AMDGPU::BI__builtin_amdgcn_readfirstlane:
225 return emitBuiltinWithOneOverloadedType<1>(expr, "amdgcn.readfirstlane")
226 .getValue();
227 case AMDGPU::BI__builtin_amdgcn_wave_shuffle: {
228 cgm.errorNYI(expr->getSourceRange(),
229 std::string("unimplemented AMDGPU builtin call: ") +
230 getContext().BuiltinInfo.getName(builtinId));
231 return mlir::Value{};
232 }
233 case AMDGPU::BI__builtin_amdgcn_div_fixup:
234 case AMDGPU::BI__builtin_amdgcn_div_fixupf:
235 case AMDGPU::BI__builtin_amdgcn_div_fixuph: {
236 cgm.errorNYI(expr->getSourceRange(),
237 std::string("unimplemented AMDGPU builtin call: ") +
238 getContext().BuiltinInfo.getName(builtinId));
239 return mlir::Value{};
240 }
241 case AMDGPU::BI__builtin_amdgcn_trig_preop:
242 case AMDGPU::BI__builtin_amdgcn_trig_preopf: {
243 cgm.errorNYI(expr->getSourceRange(),
244 std::string("unimplemented AMDGPU builtin call: ") +
245 getContext().BuiltinInfo.getName(builtinId));
246 return mlir::Value{};
247 }
248 case AMDGPU::BI__builtin_amdgcn_rcp:
249 case AMDGPU::BI__builtin_amdgcn_rcpf:
250 case AMDGPU::BI__builtin_amdgcn_rcph:
251 case AMDGPU::BI__builtin_amdgcn_rcp_bf16: {
252 cgm.errorNYI(expr->getSourceRange(),
253 std::string("unimplemented AMDGPU builtin call: ") +
254 getContext().BuiltinInfo.getName(builtinId));
255 return mlir::Value{};
256 }
257 case AMDGPU::BI__builtin_amdgcn_sqrt:
258 case AMDGPU::BI__builtin_amdgcn_sqrtf:
259 case AMDGPU::BI__builtin_amdgcn_sqrth:
260 case AMDGPU::BI__builtin_amdgcn_sqrt_bf16: {
261 cgm.errorNYI(expr->getSourceRange(),
262 std::string("unimplemented AMDGPU builtin call: ") +
263 getContext().BuiltinInfo.getName(builtinId));
264 return mlir::Value{};
265 }
266 case AMDGPU::BI__builtin_amdgcn_rsq:
267 case AMDGPU::BI__builtin_amdgcn_rsqf:
268 case AMDGPU::BI__builtin_amdgcn_rsqh:
269 case AMDGPU::BI__builtin_amdgcn_rsq_bf16: {
270 cgm.errorNYI(expr->getSourceRange(),
271 std::string("unimplemented AMDGPU builtin call: ") +
272 getContext().BuiltinInfo.getName(builtinId));
273 return mlir::Value{};
274 }
275 case AMDGPU::BI__builtin_amdgcn_rsq_clamp:
276 case AMDGPU::BI__builtin_amdgcn_rsq_clampf: {
277 cgm.errorNYI(expr->getSourceRange(),
278 std::string("unimplemented AMDGPU builtin call: ") +
279 getContext().BuiltinInfo.getName(builtinId));
280 return mlir::Value{};
281 }
282 case AMDGPU::BI__builtin_amdgcn_sinf:
283 case AMDGPU::BI__builtin_amdgcn_sinh:
284 case AMDGPU::BI__builtin_amdgcn_sin_bf16: {
285 cgm.errorNYI(expr->getSourceRange(),
286 std::string("unimplemented AMDGPU builtin call: ") +
287 getContext().BuiltinInfo.getName(builtinId));
288 return mlir::Value{};
289 }
290 case AMDGPU::BI__builtin_amdgcn_cosf:
291 case AMDGPU::BI__builtin_amdgcn_cosh:
292 case AMDGPU::BI__builtin_amdgcn_cos_bf16: {
293 cgm.errorNYI(expr->getSourceRange(),
294 std::string("unimplemented AMDGPU builtin call: ") +
295 getContext().BuiltinInfo.getName(builtinId));
296 return mlir::Value{};
297 }
298 case AMDGPU::BI__builtin_amdgcn_dispatch_ptr:
299 return emitAMDGPUDispatchPtr(*this, expr);
300 case AMDGPU::BI__builtin_amdgcn_logf:
301 case AMDGPU::BI__builtin_amdgcn_log_bf16: {
302 cgm.errorNYI(expr->getSourceRange(),
303 std::string("unimplemented AMDGPU builtin call: ") +
304 getContext().BuiltinInfo.getName(builtinId));
305 return mlir::Value{};
306 }
307 case AMDGPU::BI__builtin_amdgcn_exp2f:
308 case AMDGPU::BI__builtin_amdgcn_exp2_bf16: {
309 cgm.errorNYI(expr->getSourceRange(),
310 std::string("unimplemented AMDGPU builtin call: ") +
311 getContext().BuiltinInfo.getName(builtinId));
312 return mlir::Value{};
313 }
314 case AMDGPU::BI__builtin_amdgcn_log_clampf: {
315 cgm.errorNYI(expr->getSourceRange(),
316 std::string("unimplemented AMDGPU builtin call: ") +
317 getContext().BuiltinInfo.getName(builtinId));
318 return mlir::Value{};
319 }
320 case AMDGPU::BI__builtin_amdgcn_ldexp:
321 case AMDGPU::BI__builtin_amdgcn_ldexpf:
322 case AMDGPU::BI__builtin_amdgcn_ldexph: {
323 cgm.errorNYI(expr->getSourceRange(),
324 std::string("unimplemented AMDGPU builtin call: ") +
325 getContext().BuiltinInfo.getName(builtinId));
326 return mlir::Value{};
327 }
328 case AMDGPU::BI__builtin_amdgcn_frexp_mant:
329 case AMDGPU::BI__builtin_amdgcn_frexp_mantf:
330 case AMDGPU::BI__builtin_amdgcn_frexp_manth: {
331 cgm.errorNYI(expr->getSourceRange(),
332 std::string("unimplemented AMDGPU builtin call: ") +
333 getContext().BuiltinInfo.getName(builtinId));
334 return mlir::Value{};
335 }
336 case AMDGPU::BI__builtin_amdgcn_frexp_exp:
337 case AMDGPU::BI__builtin_amdgcn_frexp_expf:
338 case AMDGPU::BI__builtin_amdgcn_frexp_exph: {
339 cgm.errorNYI(expr->getSourceRange(),
340 std::string("unimplemented AMDGPU builtin call: ") +
341 getContext().BuiltinInfo.getName(builtinId));
342 return mlir::Value{};
343 }
344 case AMDGPU::BI__builtin_amdgcn_fract:
345 case AMDGPU::BI__builtin_amdgcn_fractf:
346 case AMDGPU::BI__builtin_amdgcn_fracth: {
347 cgm.errorNYI(expr->getSourceRange(),
348 std::string("unimplemented AMDGPU builtin call: ") +
349 getContext().BuiltinInfo.getName(builtinId));
350 return mlir::Value{};
351 }
352 case AMDGPU::BI__builtin_amdgcn_lerp: {
353 cgm.errorNYI(expr->getSourceRange(),
354 std::string("unimplemented AMDGPU builtin call: ") +
355 getContext().BuiltinInfo.getName(builtinId));
356 return mlir::Value{};
357 }
358 case AMDGPU::BI__builtin_amdgcn_ubfe: {
359 cgm.errorNYI(expr->getSourceRange(),
360 std::string("unimplemented AMDGPU builtin call: ") +
361 getContext().BuiltinInfo.getName(builtinId));
362 return mlir::Value{};
363 }
364 case AMDGPU::BI__builtin_amdgcn_sbfe: {
365 cgm.errorNYI(expr->getSourceRange(),
366 std::string("unimplemented AMDGPU builtin call: ") +
367 getContext().BuiltinInfo.getName(builtinId));
368 return mlir::Value{};
369 }
370 case AMDGPU::BI__builtin_amdgcn_ballot_w32:
371 case AMDGPU::BI__builtin_amdgcn_ballot_w64: {
372 cgm.errorNYI(expr->getSourceRange(),
373 std::string("unimplemented AMDGPU builtin call: ") +
374 getContext().BuiltinInfo.getName(builtinId));
375 return mlir::Value{};
376 }
377 case AMDGPU::BI__builtin_amdgcn_inverse_ballot_w32:
378 case AMDGPU::BI__builtin_amdgcn_inverse_ballot_w64: {
379 cgm.errorNYI(expr->getSourceRange(),
380 std::string("unimplemented AMDGPU builtin call: ") +
381 getContext().BuiltinInfo.getName(builtinId));
382 return mlir::Value{};
383 }
384 case AMDGPU::BI__builtin_amdgcn_tanhf:
385 case AMDGPU::BI__builtin_amdgcn_tanhh:
386 case AMDGPU::BI__builtin_amdgcn_tanh_bf16: {
387 cgm.errorNYI(expr->getSourceRange(),
388 std::string("unimplemented AMDGPU builtin call: ") +
389 getContext().BuiltinInfo.getName(builtinId));
390 return mlir::Value{};
391 }
392 case AMDGPU::BI__builtin_amdgcn_uicmp:
393 case AMDGPU::BI__builtin_amdgcn_uicmpl:
394 case AMDGPU::BI__builtin_amdgcn_sicmp:
395 case AMDGPU::BI__builtin_amdgcn_sicmpl: {
396 cgm.errorNYI(expr->getSourceRange(),
397 std::string("unimplemented AMDGPU builtin call: ") +
398 getContext().BuiltinInfo.getName(builtinId));
399 return mlir::Value{};
400 }
401 case AMDGPU::BI__builtin_amdgcn_fcmp:
402 case AMDGPU::BI__builtin_amdgcn_fcmpf: {
403 cgm.errorNYI(expr->getSourceRange(),
404 std::string("unimplemented AMDGPU builtin call: ") +
405 getContext().BuiltinInfo.getName(builtinId));
406 return mlir::Value{};
407 }
408 case AMDGPU::BI__builtin_amdgcn_class:
409 case AMDGPU::BI__builtin_amdgcn_classf:
410 case AMDGPU::BI__builtin_amdgcn_classh: {
411 cgm.errorNYI(expr->getSourceRange(),
412 std::string("unimplemented AMDGPU builtin call: ") +
413 getContext().BuiltinInfo.getName(builtinId));
414 return mlir::Value{};
415 }
416 case AMDGPU::BI__builtin_amdgcn_fmed3f:
417 case AMDGPU::BI__builtin_amdgcn_fmed3h: {
418 cgm.errorNYI(expr->getSourceRange(),
419 std::string("unimplemented AMDGPU builtin call: ") +
420 getContext().BuiltinInfo.getName(builtinId));
421 return mlir::Value{};
422 }
423 case AMDGPU::BI__builtin_amdgcn_ds_append:
424 case AMDGPU::BI__builtin_amdgcn_ds_consume: {
425 cgm.errorNYI(expr->getSourceRange(),
426 std::string("unimplemented AMDGPU builtin call: ") +
427 getContext().BuiltinInfo.getName(builtinId));
428 return mlir::Value{};
429 }
430 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b64_i32:
431 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b64_v2i32:
432 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v4i16:
433 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v4f16:
434 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v4bf16:
435 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v8i16:
436 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v8f16:
437 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v8bf16:
438 case AMDGPU::BI__builtin_amdgcn_global_load_tr4_b64_v2i32:
439 case AMDGPU::BI__builtin_amdgcn_global_load_tr8_b64_v2i32:
440 case AMDGPU::BI__builtin_amdgcn_global_load_tr6_b96_v3i32:
441 case AMDGPU::BI__builtin_amdgcn_global_load_tr16_b128_v8i16:
442 case AMDGPU::BI__builtin_amdgcn_global_load_tr16_b128_v8f16:
443 case AMDGPU::BI__builtin_amdgcn_global_load_tr16_b128_v8bf16: {
444 cgm.errorNYI(expr->getSourceRange(),
445 std::string("unimplemented AMDGPU builtin call: ") +
446 getContext().BuiltinInfo.getName(builtinId));
447 return mlir::Value{};
448 }
449 case AMDGPU::BI__builtin_amdgcn_ds_load_tr4_b64_v2i32:
450 case AMDGPU::BI__builtin_amdgcn_ds_load_tr8_b64_v2i32:
451 case AMDGPU::BI__builtin_amdgcn_ds_load_tr6_b96_v3i32:
452 case AMDGPU::BI__builtin_amdgcn_ds_load_tr16_b128_v8i16:
453 case AMDGPU::BI__builtin_amdgcn_ds_load_tr16_b128_v8f16:
454 case AMDGPU::BI__builtin_amdgcn_ds_load_tr16_b128_v8bf16: {
455 cgm.errorNYI(expr->getSourceRange(),
456 std::string("unimplemented AMDGPU builtin call: ") +
457 getContext().BuiltinInfo.getName(builtinId));
458 return mlir::Value{};
459 }
460 case AMDGPU::BI__builtin_amdgcn_ds_read_tr4_b64_v2i32:
461 case AMDGPU::BI__builtin_amdgcn_ds_read_tr8_b64_v2i32:
462 case AMDGPU::BI__builtin_amdgcn_ds_read_tr6_b96_v3i32:
463 case AMDGPU::BI__builtin_amdgcn_ds_read_tr16_b64_v4f16:
464 case AMDGPU::BI__builtin_amdgcn_ds_read_tr16_b64_v4bf16:
465 case AMDGPU::BI__builtin_amdgcn_ds_read_tr16_b64_v4i16: {
466 cgm.errorNYI(expr->getSourceRange(),
467 std::string("unimplemented AMDGPU builtin call: ") +
468 getContext().BuiltinInfo.getName(builtinId));
469 return mlir::Value{};
470 }
471 case AMDGPU::BI__builtin_amdgcn_global_load_monitor_b32:
472 case AMDGPU::BI__builtin_amdgcn_global_load_monitor_b64:
473 case AMDGPU::BI__builtin_amdgcn_global_load_monitor_b128:
474 case AMDGPU::BI__builtin_amdgcn_flat_load_monitor_b32:
475 case AMDGPU::BI__builtin_amdgcn_flat_load_monitor_b64:
476 case AMDGPU::BI__builtin_amdgcn_flat_load_monitor_b128: {
477 cgm.errorNYI(expr->getSourceRange(),
478 std::string("unimplemented AMDGPU builtin call: ") +
479 getContext().BuiltinInfo.getName(builtinId));
480 return mlir::Value{};
481 }
482 case AMDGPU::BI__builtin_amdgcn_cluster_load_b32:
483 case AMDGPU::BI__builtin_amdgcn_cluster_load_b64:
484 case AMDGPU::BI__builtin_amdgcn_cluster_load_b128: {
485 cgm.errorNYI(expr->getSourceRange(),
486 std::string("unimplemented AMDGPU builtin call: ") +
487 getContext().BuiltinInfo.getName(builtinId));
488 return mlir::Value{};
489 }
490 case AMDGPU::BI__builtin_amdgcn_load_to_lds: {
491 cgm.errorNYI(expr->getSourceRange(),
492 std::string("unimplemented AMDGPU builtin call: ") +
493 getContext().BuiltinInfo.getName(builtinId));
494 return mlir::Value{};
495 }
496 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_load_32x4B:
497 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_store_32x4B:
498 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_load_16x8B:
499 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_store_16x8B:
500 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_load_8x16B:
501 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_store_8x16B: {
502 cgm.errorNYI(expr->getSourceRange(),
503 std::string("unimplemented AMDGPU builtin call: ") +
504 getContext().BuiltinInfo.getName(builtinId));
505 return mlir::Value{};
506 }
507 case AMDGPU::BI__builtin_amdgcn_get_fpenv:
508 case AMDGPU::BI__builtin_amdgcn_set_fpenv: {
509 cgm.errorNYI(expr->getSourceRange(),
510 std::string("unimplemented AMDGPU builtin call: ") +
511 getContext().BuiltinInfo.getName(builtinId));
512 return mlir::Value{};
513 }
514 case AMDGPU::BI__builtin_amdgcn_read_exec:
515 case AMDGPU::BI__builtin_amdgcn_read_exec_lo:
516 case AMDGPU::BI__builtin_amdgcn_read_exec_hi: {
517 cgm.errorNYI(expr->getSourceRange(),
518 std::string("unimplemented AMDGPU builtin call: ") +
519 getContext().BuiltinInfo.getName(builtinId));
520 return mlir::Value{};
521 }
522 case AMDGPU::BI__builtin_amdgcn_image_bvh_intersect_ray:
523 case AMDGPU::BI__builtin_amdgcn_image_bvh_intersect_ray_h:
524 case AMDGPU::BI__builtin_amdgcn_image_bvh_intersect_ray_l:
525 case AMDGPU::BI__builtin_amdgcn_image_bvh_intersect_ray_lh: {
526 cgm.errorNYI(expr->getSourceRange(),
527 std::string("unimplemented AMDGPU builtin call: ") +
528 getContext().BuiltinInfo.getName(builtinId));
529 return mlir::Value{};
530 }
531 case AMDGPU::BI__builtin_amdgcn_image_bvh8_intersect_ray:
532 case AMDGPU::BI__builtin_amdgcn_image_bvh_dual_intersect_ray: {
533 cgm.errorNYI(expr->getSourceRange(),
534 std::string("unimplemented AMDGPU builtin call: ") +
535 getContext().BuiltinInfo.getName(builtinId));
536 return mlir::Value{};
537 }
538 case AMDGPU::BI__builtin_amdgcn_ds_bvh_stack_rtn:
539 case AMDGPU::BI__builtin_amdgcn_ds_bvh_stack_push4_pop1_rtn:
540 case AMDGPU::BI__builtin_amdgcn_ds_bvh_stack_push8_pop1_rtn:
541 case AMDGPU::BI__builtin_amdgcn_ds_bvh_stack_push8_pop2_rtn: {
542 cgm.errorNYI(expr->getSourceRange(),
543 std::string("unimplemented AMDGPU builtin call: ") +
544 getContext().BuiltinInfo.getName(builtinId));
545 return mlir::Value{};
546 }
547 case AMDGPU::BI__builtin_amdgcn_image_load_1d_v4f32_i32:
548 case AMDGPU::BI__builtin_amdgcn_image_load_1d_v4f16_i32:
550 "amdgcn.image.load.1d", false);
551 case AMDGPU::BI__builtin_amdgcn_image_load_1darray_v4f32_i32:
552 case AMDGPU::BI__builtin_amdgcn_image_load_1darray_v4f16_i32:
554 *this, expr, "amdgcn.image.load.1darray", false);
555 case AMDGPU::BI__builtin_amdgcn_image_load_2d_f32_i32:
556 case AMDGPU::BI__builtin_amdgcn_image_load_2d_v4f32_i32:
557 case AMDGPU::BI__builtin_amdgcn_image_load_2d_v4f16_i32:
559 "amdgcn.image.load.2d", false);
560 case AMDGPU::BI__builtin_amdgcn_image_load_2darray_f32_i32:
561 case AMDGPU::BI__builtin_amdgcn_image_load_2darray_v4f32_i32:
562 case AMDGPU::BI__builtin_amdgcn_image_load_2darray_v4f16_i32:
564 *this, expr, "amdgcn.image.load.2darray", false);
565 case AMDGPU::BI__builtin_amdgcn_image_load_3d_v4f32_i32:
566 case AMDGPU::BI__builtin_amdgcn_image_load_3d_v4f16_i32:
568 "amdgcn.image.load.3d", false);
569 case AMDGPU::BI__builtin_amdgcn_image_load_cube_v4f32_i32:
570 case AMDGPU::BI__builtin_amdgcn_image_load_cube_v4f16_i32:
572 "amdgcn.image.load.cube", false);
573 case AMDGPU::BI__builtin_amdgcn_image_load_mip_1d_v4f32_i32:
574 case AMDGPU::BI__builtin_amdgcn_image_load_mip_1d_v4f16_i32:
576 *this, expr, "amdgcn.image.load.mip.1d", false);
577 case AMDGPU::BI__builtin_amdgcn_image_load_mip_1darray_v4f32_i32:
578 case AMDGPU::BI__builtin_amdgcn_image_load_mip_1darray_v4f16_i32:
580 *this, expr, "amdgcn.image.load.mip.1darray", false);
581 case AMDGPU::BI__builtin_amdgcn_image_load_mip_2d_f32_i32:
582 case AMDGPU::BI__builtin_amdgcn_image_load_mip_2d_v4f32_i32:
583 case AMDGPU::BI__builtin_amdgcn_image_load_mip_2d_v4f16_i32:
585 *this, expr, "amdgcn.image.load.mip.2d", false);
586 case AMDGPU::BI__builtin_amdgcn_image_load_mip_2darray_f32_i32:
587 case AMDGPU::BI__builtin_amdgcn_image_load_mip_2darray_v4f32_i32:
588 case AMDGPU::BI__builtin_amdgcn_image_load_mip_2darray_v4f16_i32:
590 *this, expr, "amdgcn.image.load.mip.2darray", false);
591 case AMDGPU::BI__builtin_amdgcn_image_load_mip_3d_v4f32_i32:
592 case AMDGPU::BI__builtin_amdgcn_image_load_mip_3d_v4f16_i32:
594 *this, expr, "amdgcn.image.load.mip.3d", false);
595 case AMDGPU::BI__builtin_amdgcn_image_load_mip_cube_v4f32_i32:
596 case AMDGPU::BI__builtin_amdgcn_image_load_mip_cube_v4f16_i32:
598 *this, expr, "amdgcn.image.load.mip.cube", false);
599 case AMDGPU::BI__builtin_amdgcn_image_store_1d_v4f32_i32:
600 case AMDGPU::BI__builtin_amdgcn_image_store_1d_v4f16_i32:
602 "amdgcn.image.store.1d", true);
603 case AMDGPU::BI__builtin_amdgcn_image_store_1darray_v4f32_i32:
604 case AMDGPU::BI__builtin_amdgcn_image_store_1darray_v4f16_i32:
606 *this, expr, "amdgcn.image.store.1darray", true);
607 case AMDGPU::BI__builtin_amdgcn_image_store_2d_f32_i32:
608 case AMDGPU::BI__builtin_amdgcn_image_store_2d_v4f32_i32:
609 case AMDGPU::BI__builtin_amdgcn_image_store_2d_v4f16_i32:
611 "amdgcn.image.store.2d", true);
612 case AMDGPU::BI__builtin_amdgcn_image_store_2darray_f32_i32:
613 case AMDGPU::BI__builtin_amdgcn_image_store_2darray_v4f32_i32:
614 case AMDGPU::BI__builtin_amdgcn_image_store_2darray_v4f16_i32:
616 *this, expr, "amdgcn.image.store.2darray", true);
617 case AMDGPU::BI__builtin_amdgcn_image_store_3d_v4f32_i32:
618 case AMDGPU::BI__builtin_amdgcn_image_store_3d_v4f16_i32:
620 "amdgcn.image.store.3d", true);
621 case AMDGPU::BI__builtin_amdgcn_image_store_cube_v4f32_i32:
622 case AMDGPU::BI__builtin_amdgcn_image_store_cube_v4f16_i32:
624 "amdgcn.image.store.cube", true);
625 case AMDGPU::BI__builtin_amdgcn_image_store_mip_1d_v4f32_i32:
626 case AMDGPU::BI__builtin_amdgcn_image_store_mip_1d_v4f16_i32:
628 *this, expr, "amdgcn.image.store.mip.1d", true);
629 case AMDGPU::BI__builtin_amdgcn_image_store_mip_1darray_v4f32_i32:
630 case AMDGPU::BI__builtin_amdgcn_image_store_mip_1darray_v4f16_i32:
632 *this, expr, "amdgcn.image.store.mip.1darray", true);
633 case AMDGPU::BI__builtin_amdgcn_image_store_mip_2d_f32_i32:
634 case AMDGPU::BI__builtin_amdgcn_image_store_mip_2d_v4f32_i32:
635 case AMDGPU::BI__builtin_amdgcn_image_store_mip_2d_v4f16_i32:
637 *this, expr, "amdgcn.image.store.mip.2d", true);
638 case AMDGPU::BI__builtin_amdgcn_image_store_mip_2darray_f32_i32:
639 case AMDGPU::BI__builtin_amdgcn_image_store_mip_2darray_v4f32_i32:
640 case AMDGPU::BI__builtin_amdgcn_image_store_mip_2darray_v4f16_i32:
642 *this, expr, "amdgcn.image.store.mip.2darray", true);
643 case AMDGPU::BI__builtin_amdgcn_image_store_mip_3d_v4f32_i32:
644 case AMDGPU::BI__builtin_amdgcn_image_store_mip_3d_v4f16_i32:
646 *this, expr, "amdgcn.image.store.mip.3d", true);
647 case AMDGPU::BI__builtin_amdgcn_image_store_mip_cube_v4f32_i32:
648 case AMDGPU::BI__builtin_amdgcn_image_store_mip_cube_v4f16_i32:
650 *this, expr, "amdgcn.image.store.mip.cube", true);
651 case AMDGPU::BI__builtin_amdgcn_image_sample_1d_v4f32_f32:
652 case AMDGPU::BI__builtin_amdgcn_image_sample_1d_v4f16_f32:
653 case AMDGPU::BI__builtin_amdgcn_image_sample_1darray_v4f32_f32:
654 case AMDGPU::BI__builtin_amdgcn_image_sample_1darray_v4f16_f32:
655 case AMDGPU::BI__builtin_amdgcn_image_sample_2d_f32_f32:
656 case AMDGPU::BI__builtin_amdgcn_image_sample_2d_v4f32_f32:
657 case AMDGPU::BI__builtin_amdgcn_image_sample_2d_v4f16_f32:
658 case AMDGPU::BI__builtin_amdgcn_image_sample_2darray_f32_f32:
659 case AMDGPU::BI__builtin_amdgcn_image_sample_2darray_v4f32_f32:
660 case AMDGPU::BI__builtin_amdgcn_image_sample_2darray_v4f16_f32:
661 case AMDGPU::BI__builtin_amdgcn_image_sample_3d_v4f32_f32:
662 case AMDGPU::BI__builtin_amdgcn_image_sample_3d_v4f16_f32:
663 case AMDGPU::BI__builtin_amdgcn_image_sample_cube_v4f32_f32:
664 case AMDGPU::BI__builtin_amdgcn_image_sample_cube_v4f16_f32:
665 case AMDGPU::BI__builtin_amdgcn_image_sample_lz_1d_v4f32_f32:
666 case AMDGPU::BI__builtin_amdgcn_image_sample_lz_1d_v4f16_f32:
667 case AMDGPU::BI__builtin_amdgcn_image_sample_l_1d_v4f32_f32:
668 case AMDGPU::BI__builtin_amdgcn_image_sample_l_1d_v4f16_f32:
669 case AMDGPU::BI__builtin_amdgcn_image_sample_d_1d_v4f32_f32:
670 case AMDGPU::BI__builtin_amdgcn_image_sample_d_1d_v4f16_f32:
671 case AMDGPU::BI__builtin_amdgcn_image_sample_lz_2d_v4f32_f32:
672 case AMDGPU::BI__builtin_amdgcn_image_sample_lz_2d_v4f16_f32:
673 case AMDGPU::BI__builtin_amdgcn_image_sample_lz_2d_f32_f32:
674 case AMDGPU::BI__builtin_amdgcn_image_sample_l_2d_v4f32_f32:
675 case AMDGPU::BI__builtin_amdgcn_image_sample_l_2d_v4f16_f32:
676 case AMDGPU::BI__builtin_amdgcn_image_sample_l_2d_f32_f32:
677 case AMDGPU::BI__builtin_amdgcn_image_sample_d_2d_v4f32_f32:
678 case AMDGPU::BI__builtin_amdgcn_image_sample_d_2d_v4f16_f32:
679 case AMDGPU::BI__builtin_amdgcn_image_sample_d_2d_f32_f32:
680 case AMDGPU::BI__builtin_amdgcn_image_sample_lz_3d_v4f32_f32:
681 case AMDGPU::BI__builtin_amdgcn_image_sample_lz_3d_v4f16_f32:
682 case AMDGPU::BI__builtin_amdgcn_image_sample_l_3d_v4f32_f32:
683 case AMDGPU::BI__builtin_amdgcn_image_sample_l_3d_v4f16_f32:
684 case AMDGPU::BI__builtin_amdgcn_image_sample_d_3d_v4f32_f32:
685 case AMDGPU::BI__builtin_amdgcn_image_sample_d_3d_v4f16_f32:
686 case AMDGPU::BI__builtin_amdgcn_image_sample_lz_cube_v4f32_f32:
687 case AMDGPU::BI__builtin_amdgcn_image_sample_lz_cube_v4f16_f32:
688 case AMDGPU::BI__builtin_amdgcn_image_sample_l_cube_v4f32_f32:
689 case AMDGPU::BI__builtin_amdgcn_image_sample_l_cube_v4f16_f32:
690 case AMDGPU::BI__builtin_amdgcn_image_sample_lz_1darray_v4f32_f32:
691 case AMDGPU::BI__builtin_amdgcn_image_sample_lz_1darray_v4f16_f32:
692 case AMDGPU::BI__builtin_amdgcn_image_sample_l_1darray_v4f32_f32:
693 case AMDGPU::BI__builtin_amdgcn_image_sample_l_1darray_v4f16_f32:
694 case AMDGPU::BI__builtin_amdgcn_image_sample_d_1darray_v4f32_f32:
695 case AMDGPU::BI__builtin_amdgcn_image_sample_d_1darray_v4f16_f32:
696 case AMDGPU::BI__builtin_amdgcn_image_sample_lz_2darray_v4f32_f32:
697 case AMDGPU::BI__builtin_amdgcn_image_sample_lz_2darray_v4f16_f32:
698 case AMDGPU::BI__builtin_amdgcn_image_sample_lz_2darray_f32_f32:
699 case AMDGPU::BI__builtin_amdgcn_image_sample_l_2darray_v4f32_f32:
700 case AMDGPU::BI__builtin_amdgcn_image_sample_l_2darray_v4f16_f32:
701 case AMDGPU::BI__builtin_amdgcn_image_sample_l_2darray_f32_f32:
702 case AMDGPU::BI__builtin_amdgcn_image_sample_d_2darray_v4f32_f32:
703 case AMDGPU::BI__builtin_amdgcn_image_sample_d_2darray_v4f16_f32:
704 case AMDGPU::BI__builtin_amdgcn_image_sample_d_2darray_f32_f32: {
705 cgm.errorNYI(expr->getSourceRange(),
706 std::string("unimplemented AMDGPU builtin call: ") +
707 getContext().BuiltinInfo.getName(builtinId));
708 return mlir::Value{};
709 }
710 case AMDGPU::BI__builtin_amdgcn_image_gather4_lz_2d_v4f32_f32: {
711 cgm.errorNYI(expr->getSourceRange(),
712 std::string("unimplemented AMDGPU builtin call: ") +
713 getContext().BuiltinInfo.getName(builtinId));
714 return mlir::Value{};
715 }
716 case AMDGPU::BI__builtin_amdgcn_mfma_scale_f32_16x16x128_f8f6f4:
717 case AMDGPU::BI__builtin_amdgcn_mfma_scale_f32_32x32x64_f8f6f4: {
718 cgm.errorNYI(expr->getSourceRange(),
719 std::string("unimplemented AMDGPU builtin call: ") +
720 getContext().BuiltinInfo.getName(builtinId));
721 return mlir::Value{};
722 }
723 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w32:
724 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_tied_w32:
725 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w64:
726 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_tied_w64:
727 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w32:
728 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_tied_w32:
729 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w64:
730 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_tied_w64:
731 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf16_w32:
732 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf16_w64:
733 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_f16_w32:
734 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_f16_w64:
735 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu4_w32:
736 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu4_w64:
737 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu8_w32:
738 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu8_w64:
739 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w32_gfx12:
740 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w64_gfx12:
741 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w32_gfx12:
742 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w64_gfx12:
743 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf16_w32_gfx12:
744 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf16_w64_gfx12:
745 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_f16_w32_gfx12:
746 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_f16_w64_gfx12:
747 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu4_w32_gfx12:
748 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu4_w64_gfx12:
749 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu8_w32_gfx12:
750 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu8_w64_gfx12:
751 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_fp8_fp8_w32_gfx12:
752 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_fp8_fp8_w64_gfx12:
753 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_fp8_bf8_w32_gfx12:
754 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_fp8_bf8_w64_gfx12:
755 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf8_fp8_w32_gfx12:
756 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf8_fp8_w64_gfx12:
757 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf8_bf8_w32_gfx12:
758 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf8_bf8_w64_gfx12:
759 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x32_iu4_w32_gfx12:
760 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x32_iu4_w64_gfx12: {
761 cgm.errorNYI(expr->getSourceRange(),
762 std::string("unimplemented AMDGPU builtin call: ") +
763 getContext().BuiltinInfo.getName(builtinId));
764 return mlir::Value{};
765 }
766 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_f16_w32:
767 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_f16_w64:
768 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf16_w32:
769 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf16_w64:
770 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x32_f16_w32:
771 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x32_f16_w64:
772 case AMDGPU::BI__builtin_amdgcn_swmmac_bf16_16x16x32_bf16_w32:
773 case AMDGPU::BI__builtin_amdgcn_swmmac_bf16_16x16x32_bf16_w64:
774 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x32_iu8_w32:
775 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x32_iu8_w64:
776 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x32_iu4_w32:
777 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x32_iu4_w64:
778 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x64_iu4_w32:
779 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x64_iu4_w64:
780 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_fp8_fp8_w32:
781 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_fp8_fp8_w64:
782 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_fp8_bf8_w32:
783 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_fp8_bf8_w64:
784 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf8_fp8_w32:
785 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf8_fp8_w64:
786 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf8_bf8_w32:
787 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf8_bf8_w64: {
788 cgm.errorNYI(expr->getSourceRange(),
789 std::string("unimplemented AMDGPU builtin call: ") +
790 getContext().BuiltinInfo.getName(builtinId));
791 return mlir::Value{};
792 }
793 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x4_f32:
794 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x32_bf16:
795 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x32_f16:
796 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x32_f16:
797 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x32_bf16:
798 case AMDGPU::BI__builtin_amdgcn_wmma_bf16f32_16x16x32_bf16:
799 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x64_fp8_fp8:
800 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x64_fp8_bf8:
801 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x64_bf8_fp8:
802 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x64_bf8_bf8:
803 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x64_fp8_fp8:
804 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x64_fp8_bf8:
805 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x64_bf8_fp8:
806 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x64_bf8_bf8:
807 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x128_fp8_fp8:
808 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x128_fp8_bf8:
809 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x128_bf8_fp8:
810 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x128_bf8_bf8:
811 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_fp8_fp8:
812 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_fp8_bf8:
813 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_bf8_fp8:
814 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_bf8_bf8:
815 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x64_iu8:
816 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_f8f6f4:
817 case AMDGPU::BI__builtin_amdgcn_wmma_f32_32x16x128_f4:
818 case AMDGPU::BI__builtin_amdgcn_wmma_scale_f32_16x16x128_f8f6f4:
819 case AMDGPU::BI__builtin_amdgcn_wmma_scale16_f32_16x16x128_f8f6f4:
820 case AMDGPU::BI__builtin_amdgcn_wmma_scale_f32_32x16x128_f4:
821 case AMDGPU::BI__builtin_amdgcn_wmma_scale16_f32_32x16x128_f4: {
822 cgm.errorNYI(expr->getSourceRange(),
823 std::string("unimplemented AMDGPU builtin call: ") +
824 getContext().BuiltinInfo.getName(builtinId));
825 return mlir::Value{};
826 }
827 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x64_f16:
828 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x64_bf16:
829 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x64_f16:
830 case AMDGPU::BI__builtin_amdgcn_swmmac_bf16_16x16x64_bf16:
831 case AMDGPU::BI__builtin_amdgcn_swmmac_bf16f32_16x16x64_bf16:
832 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x128_fp8_fp8:
833 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x128_fp8_bf8:
834 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x128_bf8_fp8:
835 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x128_bf8_bf8:
836 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x128_fp8_fp8:
837 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x128_fp8_bf8:
838 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x128_bf8_fp8:
839 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x128_bf8_bf8:
840 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x128_iu8: {
841 cgm.errorNYI(expr->getSourceRange(),
842 std::string("unimplemented AMDGPU builtin call: ") +
843 getContext().BuiltinInfo.getName(builtinId));
844 return mlir::Value{};
845 }
846 // amdgcn workgroup size
847 case AMDGPU::BI__builtin_amdgcn_workgroup_size_x:
848 case AMDGPU::BI__builtin_amdgcn_workgroup_size_y:
849 case AMDGPU::BI__builtin_amdgcn_workgroup_size_z: {
850 cgm.errorNYI(expr->getSourceRange(),
851 std::string("unimplemented AMDGPU builtin call: ") +
852 getContext().BuiltinInfo.getName(builtinId));
853 return mlir::Value{};
854 }
855 case AMDGPU::BI__builtin_amdgcn_grid_size_x:
856 case AMDGPU::BI__builtin_amdgcn_grid_size_y:
857 case AMDGPU::BI__builtin_amdgcn_grid_size_z: {
858 cgm.errorNYI(expr->getSourceRange(),
859 std::string("unimplemented AMDGPU builtin call: ") +
860 getContext().BuiltinInfo.getName(builtinId));
861 return mlir::Value{};
862 }
863 case AMDGPU::BI__builtin_r600_recipsqrt_ieee:
864 case AMDGPU::BI__builtin_r600_recipsqrt_ieeef: {
865 cgm.errorNYI(expr->getSourceRange(),
866 std::string("unimplemented AMDGPU builtin call: ") +
867 getContext().BuiltinInfo.getName(builtinId));
868 return mlir::Value{};
869 }
870 case AMDGPU::BI__builtin_amdgcn_alignbit: {
871 cgm.errorNYI(expr->getSourceRange(),
872 std::string("unimplemented AMDGPU builtin call: ") +
873 getContext().BuiltinInfo.getName(builtinId));
874 return mlir::Value{};
875 }
876 case AMDGPU::BI__builtin_amdgcn_fence: {
877 cgm.errorNYI(expr->getSourceRange(),
878 std::string("unimplemented AMDGPU builtin call: ") +
879 getContext().BuiltinInfo.getName(builtinId));
880 return mlir::Value{};
881 }
882 case AMDGPU::BI__builtin_amdgcn_atomic_inc32:
883 case AMDGPU::BI__builtin_amdgcn_atomic_inc64:
884 case AMDGPU::BI__builtin_amdgcn_atomic_dec32:
885 case AMDGPU::BI__builtin_amdgcn_atomic_dec64:
886 case AMDGPU::BI__builtin_amdgcn_ds_atomic_fadd_f64:
887 case AMDGPU::BI__builtin_amdgcn_ds_atomic_fadd_f32:
888 case AMDGPU::BI__builtin_amdgcn_ds_atomic_fadd_v2f16:
889 case AMDGPU::BI__builtin_amdgcn_ds_atomic_fadd_v2bf16:
890 case AMDGPU::BI__builtin_amdgcn_ds_faddf:
891 case AMDGPU::BI__builtin_amdgcn_ds_fminf:
892 case AMDGPU::BI__builtin_amdgcn_ds_fmaxf:
893 case AMDGPU::BI__builtin_amdgcn_global_atomic_fadd_f32:
894 case AMDGPU::BI__builtin_amdgcn_global_atomic_fadd_f64:
895 case AMDGPU::BI__builtin_amdgcn_global_atomic_fadd_v2f16:
896 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fadd_v2f16:
897 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fadd_f32:
898 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fadd_f64:
899 case AMDGPU::BI__builtin_amdgcn_global_atomic_fadd_v2bf16:
900 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fadd_v2bf16:
901 case AMDGPU::BI__builtin_amdgcn_global_atomic_fmin_f64:
902 case AMDGPU::BI__builtin_amdgcn_global_atomic_fmax_f64:
903 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fmin_f64:
904 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fmax_f64: {
905 cgm.errorNYI(expr->getSourceRange(),
906 std::string("unimplemented AMDGPU builtin call: ") +
907 getContext().BuiltinInfo.getName(builtinId));
908 return mlir::Value{};
909 }
910 case AMDGPU::BI__builtin_amdgcn_s_sendmsg_rtn:
911 case AMDGPU::BI__builtin_amdgcn_s_sendmsg_rtnl: {
912 cgm.errorNYI(expr->getSourceRange(),
913 std::string("unimplemented AMDGPU builtin call: ") +
914 getContext().BuiltinInfo.getName(builtinId));
915 return mlir::Value{};
916 }
917 case AMDGPU::BI__builtin_amdgcn_permlane16_swap:
918 case AMDGPU::BI__builtin_amdgcn_permlane32_swap: {
919 cgm.errorNYI(expr->getSourceRange(),
920 std::string("unimplemented AMDGPU builtin call: ") +
921 getContext().BuiltinInfo.getName(builtinId));
922 return mlir::Value{};
923 }
924 case AMDGPU::BI__builtin_amdgcn_bitop3_b32:
925 case AMDGPU::BI__builtin_amdgcn_bitop3_b16: {
926 cgm.errorNYI(expr->getSourceRange(),
927 std::string("unimplemented AMDGPU builtin call: ") +
928 getContext().BuiltinInfo.getName(builtinId));
929 return mlir::Value{};
930 }
931 case AMDGPU::BI__builtin_amdgcn_make_buffer_rsrc: {
932 cgm.errorNYI(expr->getSourceRange(),
933 std::string("unimplemented AMDGPU builtin call: ") +
934 getContext().BuiltinInfo.getName(builtinId));
935 return mlir::Value{};
936 }
937 case AMDGPU::BI__builtin_amdgcn_raw_buffer_store_b8:
938 case AMDGPU::BI__builtin_amdgcn_raw_buffer_store_b16:
939 case AMDGPU::BI__builtin_amdgcn_raw_buffer_store_b32:
940 case AMDGPU::BI__builtin_amdgcn_raw_buffer_store_b64:
941 case AMDGPU::BI__builtin_amdgcn_raw_buffer_store_b96:
942 case AMDGPU::BI__builtin_amdgcn_raw_buffer_store_b128: {
943 cgm.errorNYI(expr->getSourceRange(),
944 std::string("unimplemented AMDGPU builtin call: ") +
945 getContext().BuiltinInfo.getName(builtinId));
946 return mlir::Value{};
947 }
948 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b8:
949 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b16:
950 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b32:
951 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b64:
952 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b96:
953 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b128: {
954 cgm.errorNYI(expr->getSourceRange(),
955 std::string("unimplemented AMDGPU builtin call: ") +
956 getContext().BuiltinInfo.getName(builtinId));
957 return mlir::Value{};
958 }
959 case AMDGPU::BI__builtin_amdgcn_raw_ptr_buffer_atomic_add_i32: {
960 cgm.errorNYI(expr->getSourceRange(),
961 std::string("unimplemented AMDGPU builtin call: ") +
962 getContext().BuiltinInfo.getName(builtinId));
963 return mlir::Value{};
964 }
965 case AMDGPU::BI__builtin_amdgcn_raw_ptr_buffer_atomic_fadd_f32:
966 case AMDGPU::BI__builtin_amdgcn_raw_ptr_buffer_atomic_fadd_v2f16: {
967 cgm.errorNYI(expr->getSourceRange(),
968 std::string("unimplemented AMDGPU builtin call: ") +
969 getContext().BuiltinInfo.getName(builtinId));
970 return mlir::Value{};
971 }
972 case AMDGPU::BI__builtin_amdgcn_raw_ptr_buffer_atomic_fmin_f32:
973 case AMDGPU::BI__builtin_amdgcn_raw_ptr_buffer_atomic_fmin_f64: {
974 cgm.errorNYI(expr->getSourceRange(),
975 std::string("unimplemented AMDGPU builtin call: ") +
976 getContext().BuiltinInfo.getName(builtinId));
977 return mlir::Value{};
978 }
979 case AMDGPU::BI__builtin_amdgcn_raw_ptr_buffer_atomic_fmax_f32:
980 case AMDGPU::BI__builtin_amdgcn_raw_ptr_buffer_atomic_fmax_f64: {
981 cgm.errorNYI(expr->getSourceRange(),
982 std::string("unimplemented AMDGPU builtin call: ") +
983 getContext().BuiltinInfo.getName(builtinId));
984 return mlir::Value{};
985 }
986 case AMDGPU::BI__builtin_amdgcn_s_prefetch_data: {
987 cgm.errorNYI(expr->getSourceRange(),
988 std::string("unimplemented AMDGPU builtin call: ") +
989 getContext().BuiltinInfo.getName(builtinId));
990 return mlir::Value{};
991 }
992 case Builtin::BIlogbf:
993 case Builtin::BI__builtin_logbf:
994 return emitLogbBuiltin(*this, expr, llvm::APFloat::IEEEsingle());
995 case Builtin::BIlogb:
996 case Builtin::BI__builtin_logb:
997 return emitLogbBuiltin(*this, expr, llvm::APFloat::IEEEdouble());
998 case Builtin::BIscalbnf:
999 case Builtin::BI__builtin_scalbnf:
1000 case Builtin::BIscalbn:
1001 case Builtin::BI__builtin_scalbn: {
1003 *this, expr, "ldexp", "experimental.constrained.ldexp");
1004 }
1005 default:
1006 return std::nullopt;
1007 }
1008}
static mlir::Value emitAMDGPUDispatchPtr(CIRGenFunction &cgf, const CallExpr *e=nullptr)
static mlir::Value emitLogbBuiltin(CIRGenFunction &cgf, const CallExpr *e, const llvm::fltSemantics &fSem)
static mlir::Value emitAMDGCNImageOverloadedReturnType(CIRGenFunction &cgf, const CallExpr *e, llvm::StringRef intrinsicName, bool isImageStore)
static mlir::Value emitBinaryExpMaybeConstrainedFPBuiltin(CIRGenFunction &cgf, const CallExpr *e, llvm::StringRef intrinsicName, llvm::StringRef constrainedIntrinsicName)
Enumerates target-specific builtins in their own namespaces within namespace clang.
cir::ConstantOp getConstant(mlir::Location loc, mlir::TypedAttr attr)
mlir::Value createAdd(mlir::Location loc, mlir::Value lhs, mlir::Value rhs, OverflowBehavior ob=OverflowBehavior::None)
cir::CmpOp createCompare(mlir::Location loc, cir::CmpOpKind kind, mlir::Value lhs, mlir::Value rhs)
mlir::Value createSelect(mlir::Location loc, mlir::Value condition, mlir::Value trueValue, mlir::Value falseValue)
mlir::Value createAddrSpaceCast(mlir::Location loc, mlir::Value src, mlir::Type newTy)
C++ view class that accepts both !cir.struct and !cir.union types.
Definition CIRTypes.h:93
mlir::Type getElementType() const
Definition Address.h:125
mlir::Value emitIntrinsicCallOp(mlir::Location loc, const llvm::StringRef str, const mlir::Type &resTy, Operands &&...op)
cir::StructType getAnonRecordTy(llvm::ArrayRef< mlir::Type > members, bool packed=false, bool padded=false)
Get a CIR anonymous struct type.
bool getIsFPConstrained() const
Query for the use of constrained floating point math.
mlir::Type convertType(clang::QualType t)
Address emitPointerWithAlignment(const clang::Expr *expr, LValueBaseInfo *baseInfo=nullptr)
Given an expression with a pointer type, emit the value and compute our best estimate of the alignmen...
RValue emitBuiltinWithOneOverloadedType(const CallExpr *e, llvm::StringRef intrinName)
Emit a simple LLVM intrinsic that takes N scalar arguments and whose return type matches the type of ...
mlir::Location getLoc(clang::SourceLocation srcLoc)
Helpers to convert Clang's SourceLocation to a MLIR Location.
std::optional< mlir::Value > emitAMDGPUBuiltinExpr(unsigned builtinID, const CallExpr *expr)
Emit a call to an AMDGPU builtin function.
mlir::Value emitScalarExpr(const clang::Expr *e, bool ignoreResultAssign=false)
Emit the computation of the specified expression of scalar type.
CIRGenBuilderTy & getBuilder()
clang::ASTContext & getContext() const
DiagnosticBuilder errorNYI(SourceLocation, llvm::StringRef)
Helpers to emit "not yet implemented" error diagnostics.
mlir::Value getValue() const
Return the value of this scalar value.
Definition CIRGenValue.h:57
CallExpr - Represents a function call (C99 6.5.2.2, C++ [expr.call]).
Definition Expr.h:2946
Expr * getArg(unsigned Arg)
getArg - Return the specified argument.
Definition Expr.h:3150
unsigned getNumArgs() const
getNumArgs - Return the number of actual arguments to this call.
Definition Expr.h:3137
SourceLocation getExprLoc() const LLVM_READONLY
getExprLoc - Return the preferred location for the arrow when diagnosing a problem with a generic exp...
Definition Expr.cpp:282
QualType getType() const
Definition Expr.h:144
SourceRange getSourceRange() const LLVM_READONLY
SourceLocation tokens are not useful in isolation - they are low level value objects created/interpre...
Definition Stmt.cpp:343
const internal::VariadicDynCastAllOfMatcher< Stmt, Expr > expr
Matches expressions.
The JSON file list parser is used to communicate input to InstallAPI.
#define exp(__x)
Definition tgmath.h:431
#define fabs(__x)
Definition tgmath.h:549