|  | ; RUN: llc < %s -mtriple=armv7-apple-darwin   | FileCheck %s | 
|  | ; RUN: llc < %s -mtriple=thumbv7-apple-darwin > %t | 
|  | ; RUN: FileCheck %s < %t | 
|  | ; RUN: FileCheck %s < %t --check-prefix=CHECK-T2ADDRMODE | 
|  |  | 
|  | %0 = type { i32, i32 } | 
|  |  | 
|  | ; CHECK-LABEL: f0: | 
|  | ; CHECK: ldrexd | 
|  | define i64 @f0(i8* %p) nounwind readonly { | 
|  | entry: | 
|  | %ldrexd = tail call %0 @llvm.arm.ldrexd(i8* %p) | 
|  | %0 = extractvalue %0 %ldrexd, 1 | 
|  | %1 = extractvalue %0 %ldrexd, 0 | 
|  | %2 = zext i32 %0 to i64 | 
|  | %3 = zext i32 %1 to i64 | 
|  | %shl = shl nuw i64 %2, 32 | 
|  | %4 = or i64 %shl, %3 | 
|  | ret i64 %4 | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: f1: | 
|  | ; CHECK: strexd | 
|  | define i32 @f1(i8* %ptr, i64 %val) nounwind { | 
|  | entry: | 
|  | %tmp4 = trunc i64 %val to i32 | 
|  | %tmp6 = lshr i64 %val, 32 | 
|  | %tmp7 = trunc i64 %tmp6 to i32 | 
|  | %strexd = tail call i32 @llvm.arm.strexd(i32 %tmp4, i32 %tmp7, i8* %ptr) | 
|  | ret i32 %strexd | 
|  | } | 
|  |  | 
|  | declare %0 @llvm.arm.ldrexd(i8*) nounwind readonly | 
|  | declare i32 @llvm.arm.strexd(i32, i32, i8*) nounwind | 
|  |  | 
|  | ; CHECK-LABEL: test_load_i8: | 
|  | ; CHECK: ldrexb r0, [r0] | 
|  | ; CHECK-NOT: uxtb | 
|  | ; CHECK-NOT: and | 
|  | define zeroext i8 @test_load_i8(i8* %addr) { | 
|  | %val = call i32 @llvm.arm.ldrex.p0i8(i8* %addr) | 
|  | %val8 = trunc i32 %val to i8 | 
|  | ret i8 %val8 | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: test_load_i16: | 
|  | ; CHECK: ldrexh r0, [r0] | 
|  | ; CHECK-NOT: uxth | 
|  | ; CHECK-NOT: and | 
|  | define zeroext i16 @test_load_i16(i16* %addr) { | 
|  | %val = call i32 @llvm.arm.ldrex.p0i16(i16* %addr) | 
|  | %val16 = trunc i32 %val to i16 | 
|  | ret i16 %val16 | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: test_load_i32: | 
|  | ; CHECK: ldrex r0, [r0] | 
|  | define i32 @test_load_i32(i32* %addr) { | 
|  | %val = call i32 @llvm.arm.ldrex.p0i32(i32* %addr) | 
|  | ret i32 %val | 
|  | } | 
|  |  | 
|  | declare i32 @llvm.arm.ldrex.p0i8(i8*) nounwind readonly | 
|  | declare i32 @llvm.arm.ldrex.p0i16(i16*) nounwind readonly | 
|  | declare i32 @llvm.arm.ldrex.p0i32(i32*) nounwind readonly | 
|  |  | 
|  | ; CHECK-LABEL: test_store_i8: | 
|  | ; CHECK-NOT: uxtb | 
|  | ; CHECK: strexb r0, r1, [r2] | 
|  | define i32 @test_store_i8(i32, i8 %val, i8* %addr) { | 
|  | %extval = zext i8 %val to i32 | 
|  | %res = call i32 @llvm.arm.strex.p0i8(i32 %extval, i8* %addr) | 
|  | ret i32 %res | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: test_store_i16: | 
|  | ; CHECK-NOT: uxth | 
|  | ; CHECK: strexh r0, r1, [r2] | 
|  | define i32 @test_store_i16(i32, i16 %val, i16* %addr) { | 
|  | %extval = zext i16 %val to i32 | 
|  | %res = call i32 @llvm.arm.strex.p0i16(i32 %extval, i16* %addr) | 
|  | ret i32 %res | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: test_store_i32: | 
|  | ; CHECK: strex r0, r1, [r2] | 
|  | define i32 @test_store_i32(i32, i32 %val, i32* %addr) { | 
|  | %res = call i32 @llvm.arm.strex.p0i32(i32 %val, i32* %addr) | 
|  | ret i32 %res | 
|  | } | 
|  |  | 
|  | declare i32 @llvm.arm.strex.p0i8(i32, i8*) nounwind | 
|  | declare i32 @llvm.arm.strex.p0i16(i32, i16*) nounwind | 
|  | declare i32 @llvm.arm.strex.p0i32(i32, i32*) nounwind | 
|  |  | 
|  | ; CHECK-LABEL: test_clear: | 
|  | ; CHECK: clrex | 
|  | define void @test_clear() { | 
|  | call void @llvm.arm.clrex() | 
|  | ret void | 
|  | } | 
|  |  | 
|  | declare void @llvm.arm.clrex() nounwind | 
|  |  | 
|  | @base = global i32* null | 
|  |  | 
|  | define void @excl_addrmode() { | 
|  | ; CHECK-T2ADDRMODE-LABEL: excl_addrmode: | 
|  | %base1020 = load i32*, i32** @base | 
|  | %offset1020 = getelementptr i32, i32* %base1020, i32 255 | 
|  | call i32 @llvm.arm.ldrex.p0i32(i32* %offset1020) | 
|  | call i32 @llvm.arm.strex.p0i32(i32 0, i32* %offset1020) | 
|  | ; CHECK-T2ADDRMODE: ldrex {{r[0-9]+}}, [{{r[0-9]+}}, #1020] | 
|  | ; CHECK-T2ADDRMODE: strex {{r[0-9]+}}, {{r[0-9]+}}, [{{r[0-9]+}}, #1020] | 
|  |  | 
|  | %base1024 = load i32*, i32** @base | 
|  | %offset1024 = getelementptr i32, i32* %base1024, i32 256 | 
|  | call i32 @llvm.arm.ldrex.p0i32(i32* %offset1024) | 
|  | call i32 @llvm.arm.strex.p0i32(i32 0, i32* %offset1024) | 
|  | ; CHECK-T2ADDRMODE: add.w r[[ADDR:[0-9]+]], {{r[0-9]+}}, #1024 | 
|  | ; CHECK-T2ADDRMODE: ldrex {{r[0-9]+}}, [r[[ADDR]]] | 
|  | ; CHECK-T2ADDRMODE: strex {{r[0-9]+}}, {{r[0-9]+}}, [r[[ADDR]]] | 
|  |  | 
|  | %base1 = load i32*, i32** @base | 
|  | %addr8 = bitcast i32* %base1 to i8* | 
|  | %offset1_8 = getelementptr i8, i8* %addr8, i32 1 | 
|  | %offset1 = bitcast i8* %offset1_8 to i32* | 
|  | call i32 @llvm.arm.ldrex.p0i32(i32* %offset1) | 
|  | call i32 @llvm.arm.strex.p0i32(i32 0, i32* %offset1) | 
|  | ; CHECK-T2ADDRMODE: adds r[[ADDR:[0-9]+]], #1 | 
|  | ; CHECK-T2ADDRMODE: ldrex {{r[0-9]+}}, [r[[ADDR]]] | 
|  | ; CHECK-T2ADDRMODE: strex {{r[0-9]+}}, {{r[0-9]+}}, [r[[ADDR]]] | 
|  |  | 
|  | %local = alloca i8, i32 1024 | 
|  | %local32 = bitcast i8* %local to i32* | 
|  | call i32 @llvm.arm.ldrex.p0i32(i32* %local32) | 
|  | call i32 @llvm.arm.strex.p0i32(i32 0, i32* %local32) | 
|  | ; CHECK-T2ADDRMODE: mov r[[ADDR:[0-9]+]], sp | 
|  | ; CHECK-T2ADDRMODE: ldrex {{r[0-9]+}}, [r[[ADDR]]] | 
|  | ; CHECK-T2ADDRMODE: strex {{r[0-9]+}}, {{r[0-9]+}}, [r[[ADDR]]] | 
|  |  | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define void @test_excl_addrmode_folded() { | 
|  | ; CHECK-LABEL: test_excl_addrmode_folded: | 
|  | %local = alloca i8, i32 4096 | 
|  |  | 
|  | %local.0 = getelementptr i8, i8* %local, i32 4 | 
|  | %local32.0 = bitcast i8* %local.0 to i32* | 
|  | call i32 @llvm.arm.ldrex.p0i32(i32* %local32.0) | 
|  | call i32 @llvm.arm.strex.p0i32(i32 0, i32* %local32.0) | 
|  | ; CHECK-T2ADDRMODE: ldrex {{r[0-9]+}}, [sp, #4] | 
|  | ; CHECK-T2ADDRMODE: strex {{r[0-9]+}}, {{r[0-9]+}}, [sp, #4] | 
|  |  | 
|  | %local.1 = getelementptr i8, i8* %local, i32 1020 | 
|  | %local32.1 = bitcast i8* %local.1 to i32* | 
|  | call i32 @llvm.arm.ldrex.p0i32(i32* %local32.1) | 
|  | call i32 @llvm.arm.strex.p0i32(i32 0, i32* %local32.1) | 
|  | ; CHECK-T2ADDRMODE: ldrex {{r[0-9]+}}, [sp, #1020] | 
|  | ; CHECK-T2ADDRMODE: strex {{r[0-9]+}}, {{r[0-9]+}}, [sp, #1020] | 
|  |  | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define void @test_excl_addrmode_range() { | 
|  | ; CHECK-LABEL: test_excl_addrmode_range: | 
|  | %local = alloca i8, i32 4096 | 
|  |  | 
|  | %local.0 = getelementptr i8, i8* %local, i32 1024 | 
|  | %local32.0 = bitcast i8* %local.0 to i32* | 
|  | call i32 @llvm.arm.ldrex.p0i32(i32* %local32.0) | 
|  | call i32 @llvm.arm.strex.p0i32(i32 0, i32* %local32.0) | 
|  | ; CHECK-T2ADDRMODE: mov r[[TMP:[0-9]+]], sp | 
|  | ; CHECK-T2ADDRMODE: add.w r[[ADDR:[0-9]+]], r[[TMP]], #1024 | 
|  | ; CHECK-T2ADDRMODE: ldrex {{r[0-9]+}}, [r[[ADDR]]] | 
|  | ; CHECK-T2ADDRMODE: strex {{r[0-9]+}}, {{r[0-9]+}}, [r[[ADDR]]] | 
|  |  | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define void @test_excl_addrmode_align() { | 
|  | ; CHECK-LABEL: test_excl_addrmode_align: | 
|  | %local = alloca i8, i32 4096 | 
|  |  | 
|  | %local.0 = getelementptr i8, i8* %local, i32 2 | 
|  | %local32.0 = bitcast i8* %local.0 to i32* | 
|  | call i32 @llvm.arm.ldrex.p0i32(i32* %local32.0) | 
|  | call i32 @llvm.arm.strex.p0i32(i32 0, i32* %local32.0) | 
|  | ; CHECK-T2ADDRMODE: mov r[[ADDR:[0-9]+]], sp | 
|  | ; CHECK-T2ADDRMODE: adds r[[ADDR:[0-9]+]], #2 | 
|  | ; CHECK-T2ADDRMODE: ldrex {{r[0-9]+}}, [r[[ADDR]]] | 
|  | ; CHECK-T2ADDRMODE: strex {{r[0-9]+}}, {{r[0-9]+}}, [r[[ADDR]]] | 
|  |  | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define void @test_excl_addrmode_sign() { | 
|  | ; CHECK-LABEL: test_excl_addrmode_sign: | 
|  | %local = alloca i8, i32 4096 | 
|  |  | 
|  | %local.0 = getelementptr i8, i8* %local, i32 -4 | 
|  | %local32.0 = bitcast i8* %local.0 to i32* | 
|  | call i32 @llvm.arm.ldrex.p0i32(i32* %local32.0) | 
|  | call i32 @llvm.arm.strex.p0i32(i32 0, i32* %local32.0) | 
|  | ; CHECK-T2ADDRMODE: mov r[[ADDR:[0-9]+]], sp | 
|  | ; CHECK-T2ADDRMODE: subs r[[ADDR:[0-9]+]], #4 | 
|  | ; CHECK-T2ADDRMODE: ldrex {{r[0-9]+}}, [r[[ADDR]]] | 
|  | ; CHECK-T2ADDRMODE: strex {{r[0-9]+}}, {{r[0-9]+}}, [r[[ADDR]]] | 
|  |  | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define void @test_excl_addrmode_combination() { | 
|  | ; CHECK-LABEL: test_excl_addrmode_combination: | 
|  | %local = alloca i8, i32 4096 | 
|  | %unused = alloca i8, i32 64 | 
|  |  | 
|  | %local.0 = getelementptr i8, i8* %local, i32 4 | 
|  | %local32.0 = bitcast i8* %local.0 to i32* | 
|  | call i32 @llvm.arm.ldrex.p0i32(i32* %local32.0) | 
|  | call i32 @llvm.arm.strex.p0i32(i32 0, i32* %local32.0) | 
|  | ; CHECK-T2ADDRMODE: ldrex {{r[0-9]+}}, [sp, #68] | 
|  | ; CHECK-T2ADDRMODE: strex {{r[0-9]+}}, {{r[0-9]+}}, [sp, #68] | 
|  |  | 
|  | ret void | 
|  | } | 
|  |  | 
|  |  | 
|  | ; LLVM should know, even across basic blocks, that ldrex is setting the high | 
|  | ; bits of its i32 to 0. There should be no zero-extend operation. | 
|  | define zeroext i8 @test_cross_block_zext_i8(i1 %tst, i8* %addr) { | 
|  | ; CHECK: test_cross_block_zext_i8: | 
|  | ; CHECK-NOT: uxtb | 
|  | ; CHECK-NOT: and | 
|  | ; CHECK: bx lr | 
|  | %val = call i32 @llvm.arm.ldrex.p0i8(i8* %addr) | 
|  | br i1 %tst, label %end, label %mid | 
|  | mid: | 
|  | ret i8 42 | 
|  | end: | 
|  | %val8 = trunc i32 %val to i8 | 
|  | ret i8 %val8 | 
|  | } |