3
3
// RUN: %clang_cc1 -triple x86_64 -S -emit-llvm -o - %s | FileCheck %s
4
4
//
5
5
// Verifies that clang detects the inline version of memcpy and uses it instead of the builtin.
6
+ // Checks alternate version with the `artificial` attribute.
6
7
7
8
typedef unsigned long size_t ;
8
9
9
10
// Clang requires these attributes for a function to be redefined.
10
11
#define AVAILABLE_EXTERNALLY extern inline __attribute__((always_inline)) __attribute__((gnu_inline))
11
12
13
+ #define AVAILABLE_EXTERNALLY_ALTERNATE extern inline __attribute__((__always_inline__)) __attribute__((__artificial__)) // alternate attribute set: `artificial` in place of `gnu_inline`
14
+
12
15
// Clang recognizes an inline builtin and renames it to prevent conflict with builtins.
13
16
// Inline redefinition of memcpy. AVAILABLE_EXTERNALLY expands to `extern inline`
// with the always_inline and gnu_inline attributes.
AVAILABLE_EXTERNALLY void * memcpy (void * a , const void * b , size_t c ) {
14
17
asm("# memcpy.inline marker" ); // inline-asm marker identifying this body; presumably matched by the CHECK lines for foo (not fully visible here)
15
18
return __builtin_memcpy (a , b , c ); // forward to the compiler builtin
16
19
}
17
20
21
+ // Clang likewise recognizes the `artificial` variant as an inline builtin and renames it to prevent conflict with builtins.
22
+ AVAILABLE_EXTERNALLY_ALTERNATE void * memmove (void * a , const void * b , size_t c ) { // inline redefinition of memmove using the always_inline + artificial attribute set
23
+ asm("# memmove.inline marker" ); // marker; the CHECK lines for foo_alt expect this asm in the caller's IR
24
+ return __builtin_memmove (a , b , c ); // forward to the builtin; the CHECK lines for foo_alt expect @llvm.memmove here
25
+ }
26
+
18
27
// CHECK-LABEL: @foo(
19
28
// CHECK-NEXT: entry:
20
29
// CHECK-NEXT: [[A_ADDR_I:%.*]] = alloca ptr, align 8
@@ -43,6 +52,34 @@ void *foo(void *a, const void *b, size_t c) {
43
52
return memcpy (a , b , c );
44
53
}
45
54
55
+ // CHECK-LABEL: @foo_alt(
56
+ // CHECK-NEXT: entry:
57
+ // CHECK-NEXT: [[A_ADDR_I:%.*]] = alloca ptr, align 8
58
+ // CHECK-NEXT: [[B_ADDR_I:%.*]] = alloca ptr, align 8
59
+ // CHECK-NEXT: [[C_ADDR_I:%.*]] = alloca i64, align 8
60
+ // CHECK-NEXT: [[A_ADDR:%.*]] = alloca ptr, align 8
61
+ // CHECK-NEXT: [[B_ADDR:%.*]] = alloca ptr, align 8
62
+ // CHECK-NEXT: [[C_ADDR:%.*]] = alloca i64, align 8
63
+ // CHECK-NEXT: store ptr [[A:%.*]], ptr [[A_ADDR]], align 8
64
+ // CHECK-NEXT: store ptr [[B:%.*]], ptr [[B_ADDR]], align 8
65
+ // CHECK-NEXT: store i64 [[C:%.*]], ptr [[C_ADDR]], align 8
66
+ // CHECK-NEXT: [[TMP0:%.*]] = load ptr, ptr [[A_ADDR]], align 8
67
+ // CHECK-NEXT: [[TMP1:%.*]] = load ptr, ptr [[B_ADDR]], align 8
68
+ // CHECK-NEXT: [[TMP2:%.*]] = load i64, ptr [[C_ADDR]], align 8
69
+ // CHECK-NEXT: store ptr [[TMP0]], ptr [[A_ADDR_I]], align 8
70
+ // CHECK-NEXT: store ptr [[TMP1]], ptr [[B_ADDR_I]], align 8
71
+ // CHECK-NEXT: store i64 [[TMP2]], ptr [[C_ADDR_I]], align 8
72
+ // CHECK-NEXT: call void asm sideeffect "# memmove.inline marker", "~{dirflag},~{fpsr},~{flags}"() #[[ATTR3]], !srcloc !3
73
+ // CHECK-NEXT: [[TMP3:%.*]] = load ptr, ptr [[A_ADDR_I]], align 8
74
+ // CHECK-NEXT: [[TMP4:%.*]] = load ptr, ptr [[B_ADDR_I]], align 8
75
+ // CHECK-NEXT: [[TMP5:%.*]] = load i64, ptr [[C_ADDR_I]], align 8
76
+ // CHECK-NEXT: call void @llvm.memmove.p0.p0.i64(ptr align 1 [[TMP3]], ptr align 1 [[TMP4]], i64 [[TMP5]], i1 false)
77
+ // CHECK-NEXT: ret ptr [[TMP3]]
78
+ //
79
+ void * foo_alt (void * a , const void * b , size_t c ) { // direct-call case: the CHECK lines above expect the inline memmove body (asm marker, then @llvm.memmove) inside this function
80
+ return memmove (a , b , c );
81
+ }
82
+
46
83
// CHECK-LABEL: @bar(
47
84
// CHECK-NEXT: entry:
48
85
// CHECK-NEXT: [[A_ADDR:%.*]] = alloca ptr, align 8
@@ -68,3 +105,29 @@ void bar(void *a, const void *b, size_t c) {
68
105
void * (* cpy )(void * , const void * , size_t ) = c > 10 ? memcpy : foo ;
69
106
cpy (a , b , c );
70
107
}
108
+
109
+ // CHECK-LABEL: @bar_alt(
110
+ // CHECK-NEXT: entry:
111
+ // CHECK-NEXT: [[A_ADDR:%.*]] = alloca ptr, align 8
112
+ // CHECK-NEXT: [[B_ADDR:%.*]] = alloca ptr, align 8
113
+ // CHECK-NEXT: [[C_ADDR:%.*]] = alloca i64, align 8
114
+ // CHECK-NEXT: [[CPY:%.*]] = alloca ptr, align 8
115
+ // CHECK-NEXT: store ptr [[A:%.*]], ptr [[A_ADDR]], align 8
116
+ // CHECK-NEXT: store ptr [[B:%.*]], ptr [[B_ADDR]], align 8
117
+ // CHECK-NEXT: store i64 [[C:%.*]], ptr [[C_ADDR]], align 8
118
+ // CHECK-NEXT: [[TMP0:%.*]] = load i64, ptr [[C_ADDR]], align 8
119
+ // CHECK-NEXT: [[CMP:%.*]] = icmp ugt i64 [[TMP0]], 10
120
+ // CHECK-NEXT: [[TMP1:%.*]] = zext i1 [[CMP]] to i64
121
+ // CHECK-NEXT: [[COND:%.*]] = select i1 [[CMP]], ptr @memmove, ptr @foo_alt
122
+ // CHECK-NEXT: store ptr [[COND]], ptr [[CPY]], align 8
123
+ // CHECK-NEXT: [[TMP2:%.*]] = load ptr, ptr [[CPY]], align 8
124
+ // CHECK-NEXT: [[TMP3:%.*]] = load ptr, ptr [[A_ADDR]], align 8
125
+ // CHECK-NEXT: [[TMP4:%.*]] = load ptr, ptr [[B_ADDR]], align 8
126
+ // CHECK-NEXT: [[TMP5:%.*]] = load i64, ptr [[C_ADDR]], align 8
127
+ // CHECK-NEXT: [[CALL:%.*]] = call ptr [[TMP2]](ptr noundef [[TMP3]], ptr noundef [[TMP4]], i64 noundef [[TMP5]])
128
+ // CHECK-NEXT: ret void
129
+ //
130
+ void bar_alt (void * a , const void * b , size_t c ) { // indirect-use case: memmove is referenced by address instead of being called directly
131
+ void * (* cpy )(void * , const void * , size_t ) = c > 10 ? memmove : foo_alt ; // the CHECK lines above expect a select between @memmove and @foo_alt
132
+ cpy (a , b , c ); // call through the pointer; the returned pointer is discarded
133
+ }
0 commit comments