1 // RUN: %clang_cc1 %s -ffreestanding -triple=x86_64-unknown-unknown -target-feature +amx-tf32 -target-feature +amx-transpose -emit-llvm -o - -Wall -Werror -pedantic | FileCheck %s
3 void f_tilemul(short a
)
5 //CHECK: call void asm sideeffect "tileloadd 0(%rsi,%r13,4), %tmm0 \0A\09tileloadd 0(%rdx,%r14,4), %tmm6 \0A\09tmmultf32ps %tmm6, %tmm0, %tmm7 \0A\09tilestored %tmm7, 0(%r12,%r15,4) \0A\09", "~{memory},~{tmm0},~{tmm6},~{tmm7},~{dirflag},~{fpsr},~{flags}"()
6 __asm__
volatile ("tileloadd 0(%%rsi,%%r13,4), %%tmm0 \n\t"
7 "tileloadd 0(%%rdx,%%r14,4), %%tmm6 \n\t"
8 "tmmultf32ps %%tmm6, %%tmm0, %%tmm7 \n\t"
9 "tilestored %%tmm7, 0(%%r12,%%r15,4) \n\t"
10 ::: "memory", "tmm0", "tmm6", "tmm7");
12 //CHECK: call void asm sideeffect "tileloadd 0(%rsi,%r13,4), %tmm0 \0A\09tileloadd 0(%rdx,%r14,4), %tmm6 \0A\09ttmmultf32ps %tmm6, %tmm0, %tmm7 \0A\09tilestored %tmm7, 0(%r12,%r15,4) \0A\09", "~{memory},~{tmm0},~{tmm6},~{tmm7},~{dirflag},~{fpsr},~{flags}"()
13 __asm__
volatile ("tileloadd 0(%%rsi,%%r13,4), %%tmm0 \n\t"
14 "tileloadd 0(%%rdx,%%r14,4), %%tmm6 \n\t"
15 "ttmmultf32ps %%tmm6, %%tmm0, %%tmm7 \n\t"
16 "tilestored %%tmm7, 0(%%r12,%%r15,4) \n\t"
17 ::: "memory", "tmm0", "tmm6", "tmm7");