Run DCE after a LoopFlatten test to reduce spurious output [nfc]
[llvm-project.git] / clang / test / CodeGen / X86 / amx_inline_asm.c
blob24788adfd2cbad0d61adea9753241a834caacd03
1 // RUN: %clang_cc1 %s -ffreestanding -triple=x86_64-unknown-unknown -target-feature +amx-int8 -target-feature +amx-bf16 -emit-llvm -o - -Wall -Werror -pedantic | FileCheck %s
// f_tilemul: holds one inline-asm statement; the FileCheck directive below
// matches the LLVM IR call that the compiler is expected to emit for it.
// The parameter `a` is not referenced anywhere in the visible lines.
// NOTE(review): the leading numbers on each line look like line-number residue
// from a web source viewer, and the function's braces are not visible in this
// view -- confirm against the upstream file before relying on this text.
3 void f_tilemul(short a)
// Expected IR (next line): a `call void asm sideeffect` carrying the same four
// instructions. Relative to the C source, each `%%` appears as a single `%`
// and each "\n\t" appears as `\0A\09`. The expected constraint string lists
// the four clobbers written in the source plus dirflag, fpsr and flags, which
// are not written in the source (presumably added by the compiler for this
// target -- TODO confirm).
5 //CHECK: call void asm sideeffect "tileloadd 0(%rsi,%r13,4), %tmm0 \0A\09tileloadd 0(%rdx,%r14,4), %tmm6 \0A\09tdpbf16ps %tmm6, %tmm0, %tmm7 \0A\09tilestored %tmm7, 0(%r12,%r15,4) \0A\09", "~{memory},~{tmm0},~{tmm6},~{tmm7},~{dirflag},~{fpsr},~{flags}"()
// The asm template is four adjacent string literals (one instruction each),
// concatenated by the compiler into a single template string.
6 __asm__ volatile ("tileloadd 0(%%rsi,%%r13,4), %%tmm0 \n\t"
7 "tileloadd 0(%%rdx,%%r14,4), %%tmm6 \n\t"
8 "tdpbf16ps %%tmm6, %%tmm0, %%tmm7 \n\t"
9 "tilestored %%tmm7, 0(%%r12,%%r15,4) \n\t"
// `:::` leaves the output and input operand lists empty; only clobbers are
// declared: "memory" and the registers tmm0, tmm6 and tmm7.
10 ::: "memory", "tmm0", "tmm6", "tmm7");