Skip to content

Commit 2e94f54

Browse files
authored
Merge pull request #745 from GuillaumeGomez/regen
Regenerate intrinsics mapping
2 parents f682d09 + 9fb9910 commit 2e94f54

File tree

1 file changed

+60
-0
lines changed

1 file changed

+60
-0
lines changed

src/intrinsic/archs.rs

Lines changed: 60 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -95,8 +95,11 @@ fn map_arch_intrinsic(full_name: &str) -> &'static str {
9595
"cubema" => "__builtin_amdgcn_cubema",
9696
"cubesc" => "__builtin_amdgcn_cubesc",
9797
"cubetc" => "__builtin_amdgcn_cubetc",
98+
"cvt.f16.bf8" => "__builtin_amdgcn_cvt_f16_bf8",
99+
"cvt.f16.fp8" => "__builtin_amdgcn_cvt_f16_fp8",
98100
"cvt.f32.bf8" => "__builtin_amdgcn_cvt_f32_bf8",
99101
"cvt.f32.fp8" => "__builtin_amdgcn_cvt_f32_fp8",
102+
"cvt.f32.fp8.e5m3" => "__builtin_amdgcn_cvt_f32_fp8_e5m3",
100103
"cvt.off.f32.i4" => "__builtin_amdgcn_cvt_off_f32_i4",
101104
"cvt.pk.bf8.f32" => "__builtin_amdgcn_cvt_pk_bf8_f32",
102105
"cvt.pk.f16.bf8" => "__builtin_amdgcn_cvt_pk_f16_bf8",
@@ -181,6 +184,12 @@ fn map_arch_intrinsic(full_name: &str) -> &'static str {
181184
"dot4.f32.fp8.bf8" => "__builtin_amdgcn_dot4_f32_fp8_bf8",
182185
"dot4.f32.fp8.fp8" => "__builtin_amdgcn_dot4_f32_fp8_fp8",
183186
"ds.add.gs.reg.rtn" => "__builtin_amdgcn_ds_add_gs_reg_rtn",
187+
"ds.atomic.async.barrier.arrive.b64" => {
188+
"__builtin_amdgcn_ds_atomic_async_barrier_arrive_b64"
189+
}
190+
"ds.atomic.barrier.arrive.rtn.b64" => {
191+
"__builtin_amdgcn_ds_atomic_barrier_arrive_rtn_b64"
192+
}
184193
"ds.bpermute" => "__builtin_amdgcn_ds_bpermute",
185194
"ds.bpermute.fi.b32" => "__builtin_amdgcn_ds_bpermute_fi_b32",
186195
"ds.gws.barrier" => "__builtin_amdgcn_ds_gws_barrier",
@@ -198,8 +207,32 @@ fn map_arch_intrinsic(full_name: &str) -> &'static str {
198207
"fdot2.f16.f16" => "__builtin_amdgcn_fdot2_f16_f16",
199208
"fdot2.f32.bf16" => "__builtin_amdgcn_fdot2_f32_bf16",
200209
"fdot2c.f32.bf16" => "__builtin_amdgcn_fdot2c_f32_bf16",
210+
"flat.prefetch" => "__builtin_amdgcn_flat_prefetch",
201211
"fmul.legacy" => "__builtin_amdgcn_fmul_legacy",
212+
"global.load.async.to.lds.b128" => {
213+
"__builtin_amdgcn_global_load_async_to_lds_b128"
214+
}
215+
"global.load.async.to.lds.b32" => {
216+
"__builtin_amdgcn_global_load_async_to_lds_b32"
217+
}
218+
"global.load.async.to.lds.b64" => {
219+
"__builtin_amdgcn_global_load_async_to_lds_b64"
220+
}
221+
"global.load.async.to.lds.b8" => "__builtin_amdgcn_global_load_async_to_lds_b8",
202222
"global.load.lds" => "__builtin_amdgcn_global_load_lds",
223+
"global.prefetch" => "__builtin_amdgcn_global_prefetch",
224+
"global.store.async.from.lds.b128" => {
225+
"__builtin_amdgcn_global_store_async_from_lds_b128"
226+
}
227+
"global.store.async.from.lds.b32" => {
228+
"__builtin_amdgcn_global_store_async_from_lds_b32"
229+
}
230+
"global.store.async.from.lds.b64" => {
231+
"__builtin_amdgcn_global_store_async_from_lds_b64"
232+
}
233+
"global.store.async.from.lds.b8" => {
234+
"__builtin_amdgcn_global_store_async_from_lds_b8"
235+
}
203236
"groupstaticsize" => "__builtin_amdgcn_groupstaticsize",
204237
"iglp.opt" => "__builtin_amdgcn_iglp_opt",
205238
"implicit.buffer.ptr" => "__builtin_amdgcn_implicit_buffer_ptr",
@@ -291,6 +324,7 @@ fn map_arch_intrinsic(full_name: &str) -> &'static str {
291324
"s.incperflevel" => "__builtin_amdgcn_s_incperflevel",
292325
"s.memrealtime" => "__builtin_amdgcn_s_memrealtime",
293326
"s.memtime" => "__builtin_amdgcn_s_memtime",
327+
"s.monitor.sleep" => "__builtin_amdgcn_s_monitor_sleep",
294328
"s.sendmsg" => "__builtin_amdgcn_s_sendmsg",
295329
"s.sendmsghalt" => "__builtin_amdgcn_s_sendmsghalt",
296330
"s.setprio" => "__builtin_amdgcn_s_setprio",
@@ -300,11 +334,15 @@ fn map_arch_intrinsic(full_name: &str) -> &'static str {
300334
"s.sleep.var" => "__builtin_amdgcn_s_sleep_var",
301335
"s.ttracedata" => "__builtin_amdgcn_s_ttracedata",
302336
"s.ttracedata.imm" => "__builtin_amdgcn_s_ttracedata_imm",
337+
"s.wait.asynccnt" => "__builtin_amdgcn_s_wait_asynccnt",
303338
"s.wait.event.export.ready" => "__builtin_amdgcn_s_wait_event_export_ready",
339+
"s.wait.tensorcnt" => "__builtin_amdgcn_s_wait_tensorcnt",
304340
"s.waitcnt" => "__builtin_amdgcn_s_waitcnt",
305341
"sad.hi.u8" => "__builtin_amdgcn_sad_hi_u8",
306342
"sad.u16" => "__builtin_amdgcn_sad_u16",
307343
"sad.u8" => "__builtin_amdgcn_sad_u8",
344+
"sat.pk4.i4.i8" => "__builtin_amdgcn_sat_pk4_i4_i8",
345+
"sat.pk4.u4.u8" => "__builtin_amdgcn_sat_pk4_u4_u8",
308346
"sched.barrier" => "__builtin_amdgcn_sched_barrier",
309347
"sched.group.barrier" => "__builtin_amdgcn_sched_group_barrier",
310348
"sdot2" => "__builtin_amdgcn_sdot2",
@@ -346,8 +384,13 @@ fn map_arch_intrinsic(full_name: &str) -> &'static str {
346384
"smfmac.i32.16x16x64.i8" => "__builtin_amdgcn_smfmac_i32_16x16x64_i8",
347385
"smfmac.i32.32x32x32.i8" => "__builtin_amdgcn_smfmac_i32_32x32x32_i8",
348386
"smfmac.i32.32x32x64.i8" => "__builtin_amdgcn_smfmac_i32_32x32x64_i8",
387+
"struct.ptr.buffer.load.lds" => "__builtin_amdgcn_struct_ptr_buffer_load_lds",
349388
"sudot4" => "__builtin_amdgcn_sudot4",
350389
"sudot8" => "__builtin_amdgcn_sudot8",
390+
"tensor.load.to.lds" => "__builtin_amdgcn_tensor_load_to_lds",
391+
"tensor.load.to.lds.d2" => "__builtin_amdgcn_tensor_load_to_lds_d2",
392+
"tensor.store.from.lds" => "__builtin_amdgcn_tensor_store_from_lds",
393+
"tensor.store.from.lds.d2" => "__builtin_amdgcn_tensor_store_from_lds_d2",
351394
"udot2" => "__builtin_amdgcn_udot2",
352395
"udot4" => "__builtin_amdgcn_udot4",
353396
"udot8" => "__builtin_amdgcn_udot8",
@@ -6326,6 +6369,23 @@ fn map_arch_intrinsic(full_name: &str) -> &'static str {
63266369
}
63276370
s390(name, full_name)
63286371
}
6372+
"spv" => {
6373+
#[allow(non_snake_case)]
6374+
fn spv(name: &str, full_name: &str) -> &'static str {
6375+
match name {
6376+
// spv
6377+
"num.subgroups" => "__builtin_spirv_num_subgroups",
6378+
"subgroup.id" => "__builtin_spirv_subgroup_id",
6379+
"subgroup.local.invocation.id" => {
6380+
"__builtin_spirv_subgroup_local_invocation_id"
6381+
}
6382+
"subgroup.max.size" => "__builtin_spirv_subgroup_max_size",
6383+
"subgroup.size" => "__builtin_spirv_subgroup_size",
6384+
_ => unimplemented!("***** unsupported LLVM intrinsic {full_name}"),
6385+
}
6386+
}
6387+
spv(name, full_name)
6388+
}
63296389
"ve" => {
63306390
#[allow(non_snake_case)]
63316391
fn ve(name: &str, full_name: &str) -> &'static str {

0 commit comments

Comments
 (0)