1 ; RUN: llc -mtriple=x86_64-- < %s | FileCheck %s
3 target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
4 target triple = "x86_64--"
6 ; Function Attrs: nounwind uwtable
7 define { i64, i64 } @foo(i8* %ptr, i128* nocapture readonly %src, i128* nocapture readonly %dst) local_unnamed_addr #0 {
9 %0 = load i128, i128* %dst, align 16, !tbaa !1
10 %shr = lshr i128 %0, 64
11 %conv = trunc i128 %shr to i64
12 %conv1 = trunc i128 %0 to i64
13 %1 = load i128, i128* %src, align 16, !tbaa !1
14 %2 = tail call i128 asm sideeffect "lock; cmpxchg16b $1", "=A,=*m,{cx},{bx},0,*m,~{dirflag},~{fpsr},~{flags}"(i8* %ptr, i64 %conv, i64 %conv1, i128 %1, i8* %ptr) #1, !srcloc !5
15 %retval.sroa.0.0.extract.trunc = trunc i128 %2 to i64
16 %retval.sroa.2.0.extract.shift = lshr i128 %2, 64
17 %retval.sroa.2.0.extract.trunc = trunc i128 %retval.sroa.2.0.extract.shift to i64
18 %.fca.0.insert = insertvalue { i64, i64 } undef, i64 %retval.sroa.0.0.extract.trunc, 0
19 %.fca.1.insert = insertvalue { i64, i64 } %.fca.0.insert, i64 %retval.sroa.2.0.extract.trunc, 1
20 ret { i64, i64 } %.fca.1.insert
23 ; CHECK-NEXT: cmpxchg16b
25 attributes #0 = { nounwind uwtable "correctly-rounded-divide-sqrt-fp-math"="false" "disable-tail-calls"="false" "less-precise-fpmad"="false" "no-frame-pointer-elim"="true" "no-frame-pointer-elim-non-leaf" "no-infs-fp-math"="false" "no-jump-tables"="false" "no-nans-fp-math"="false" "no-signed-zeros-fp-math"="false" "no-trapping-math"="false" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+fxsr,+mmx,+sse,+sse2,+x87" "unsafe-fp-math"="false" "use-soft-float"="false" }
26 attributes #1 = { nounwind }
30 !0 = !{!"clang version 5.0.0 (trunk 300088)"}
32 !2 = !{!"__int128", !3, i64 0}
33 !3 = !{!"omnipotent char", !4, i64 0}
34 !4 = !{!"Simple C/C++ TBAA"}