Skip to content

Commit fd8745c

Browse files
[clang] Do not require GNUInlineAttr for inline builtins
Fix llvm#61691. Differential Revision: https://reviews.llvm.org/D147307
1 parent fd1d608 commit fd8745c

File tree

3 files changed

+65
-3
lines changed

3 files changed

+65
-3
lines changed

clang/lib/AST/Decl.cpp

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -3302,8 +3302,7 @@ bool FunctionDecl::isInlineBuiltinDeclaration() const {
33023302

33033303
const FunctionDecl *Definition;
33043304
return hasBody(Definition) && Definition->isInlineSpecified() &&
3305-
Definition->hasAttr<AlwaysInlineAttr>() &&
3306-
Definition->hasAttr<GNUInlineAttr>();
3305+
Definition->hasAttr<AlwaysInlineAttr>();
33073306
}
33083307

33093308
bool FunctionDecl::isDestroyingOperatorDelete() const {

clang/test/CodeGen/memcpy-inline-builtin.c

Lines changed: 63 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -3,18 +3,27 @@
33
// RUN: %clang_cc1 -triple x86_64 -S -emit-llvm -o - %s | FileCheck %s
44
//
55
// Verifies that clang detects memcpy inline version and uses it instead of the builtin.
6+
// Checks alternate version with the `artificial` attribute.
67

78
typedef unsigned long size_t;
89

910
// Clang requires these attributes for a function to be redefined.
1011
#define AVAILABLE_EXTERNALLY extern inline __attribute__((always_inline)) __attribute__((gnu_inline))
1112

13+
#define AVAILABLE_EXTERNALLY_ALTERNATE extern inline __attribute__((__always_inline__)) __attribute__((__artificial__))
14+
1215
// Clang recognizes an inline builtin and renames it to prevent conflict with builtins.
1316
AVAILABLE_EXTERNALLY void *memcpy(void *a, const void *b, size_t c) {
1417
asm("# memcpy.inline marker");
1518
return __builtin_memcpy(a, b, c);
1619
}
1720

21+
// Clang recognizes an inline builtin and renames it to prevent conflict with builtins.
22+
AVAILABLE_EXTERNALLY_ALTERNATE void *memmove(void *a, const void *b, size_t c) {
23+
asm("# memmove.inline marker");
24+
return __builtin_memmove(a, b, c);
25+
}
26+
1827
// CHECK-LABEL: @foo(
1928
// CHECK-NEXT: entry:
2029
// CHECK-NEXT: [[A_ADDR_I:%.*]] = alloca ptr, align 8
@@ -43,6 +52,34 @@ void *foo(void *a, const void *b, size_t c) {
4352
return memcpy(a, b, c);
4453
}
4554

55+
// CHECK-LABEL: @foo_alt(
56+
// CHECK-NEXT: entry:
57+
// CHECK-NEXT: [[A_ADDR_I:%.*]] = alloca ptr, align 8
58+
// CHECK-NEXT: [[B_ADDR_I:%.*]] = alloca ptr, align 8
59+
// CHECK-NEXT: [[C_ADDR_I:%.*]] = alloca i64, align 8
60+
// CHECK-NEXT: [[A_ADDR:%.*]] = alloca ptr, align 8
61+
// CHECK-NEXT: [[B_ADDR:%.*]] = alloca ptr, align 8
62+
// CHECK-NEXT: [[C_ADDR:%.*]] = alloca i64, align 8
63+
// CHECK-NEXT: store ptr [[A:%.*]], ptr [[A_ADDR]], align 8
64+
// CHECK-NEXT: store ptr [[B:%.*]], ptr [[B_ADDR]], align 8
65+
// CHECK-NEXT: store i64 [[C:%.*]], ptr [[C_ADDR]], align 8
66+
// CHECK-NEXT: [[TMP0:%.*]] = load ptr, ptr [[A_ADDR]], align 8
67+
// CHECK-NEXT: [[TMP1:%.*]] = load ptr, ptr [[B_ADDR]], align 8
68+
// CHECK-NEXT: [[TMP2:%.*]] = load i64, ptr [[C_ADDR]], align 8
69+
// CHECK-NEXT: store ptr [[TMP0]], ptr [[A_ADDR_I]], align 8
70+
// CHECK-NEXT: store ptr [[TMP1]], ptr [[B_ADDR_I]], align 8
71+
// CHECK-NEXT: store i64 [[TMP2]], ptr [[C_ADDR_I]], align 8
72+
// CHECK-NEXT: call void asm sideeffect "# memmove.inline marker", "~{dirflag},~{fpsr},~{flags}"() #[[ATTR3]], !srcloc !3
73+
// CHECK-NEXT: [[TMP3:%.*]] = load ptr, ptr [[A_ADDR_I]], align 8
74+
// CHECK-NEXT: [[TMP4:%.*]] = load ptr, ptr [[B_ADDR_I]], align 8
75+
// CHECK-NEXT: [[TMP5:%.*]] = load i64, ptr [[C_ADDR_I]], align 8
76+
// CHECK-NEXT: call void @llvm.memmove.p0.p0.i64(ptr align 1 [[TMP3]], ptr align 1 [[TMP4]], i64 [[TMP5]], i1 false)
77+
// CHECK-NEXT: ret ptr [[TMP3]]
78+
//
79+
void *foo_alt(void *a, const void *b, size_t c) {
80+
return memmove(a, b, c);
81+
}
82+
4683
// CHECK-LABEL: @bar(
4784
// CHECK-NEXT: entry:
4885
// CHECK-NEXT: [[A_ADDR:%.*]] = alloca ptr, align 8
@@ -68,3 +105,29 @@ void bar(void *a, const void *b, size_t c) {
68105
void *(*cpy)(void *, const void *, size_t) = c > 10 ? memcpy : foo;
69106
cpy(a, b, c);
70107
}
108+
109+
// CHECK-LABEL: @bar_alt(
110+
// CHECK-NEXT: entry:
111+
// CHECK-NEXT: [[A_ADDR:%.*]] = alloca ptr, align 8
112+
// CHECK-NEXT: [[B_ADDR:%.*]] = alloca ptr, align 8
113+
// CHECK-NEXT: [[C_ADDR:%.*]] = alloca i64, align 8
114+
// CHECK-NEXT: [[CPY:%.*]] = alloca ptr, align 8
115+
// CHECK-NEXT: store ptr [[A:%.*]], ptr [[A_ADDR]], align 8
116+
// CHECK-NEXT: store ptr [[B:%.*]], ptr [[B_ADDR]], align 8
117+
// CHECK-NEXT: store i64 [[C:%.*]], ptr [[C_ADDR]], align 8
118+
// CHECK-NEXT: [[TMP0:%.*]] = load i64, ptr [[C_ADDR]], align 8
119+
// CHECK-NEXT: [[CMP:%.*]] = icmp ugt i64 [[TMP0]], 10
120+
// CHECK-NEXT: [[TMP1:%.*]] = zext i1 [[CMP]] to i64
121+
// CHECK-NEXT: [[COND:%.*]] = select i1 [[CMP]], ptr @memmove, ptr @foo_alt
122+
// CHECK-NEXT: store ptr [[COND]], ptr [[CPY]], align 8
123+
// CHECK-NEXT: [[TMP2:%.*]] = load ptr, ptr [[CPY]], align 8
124+
// CHECK-NEXT: [[TMP3:%.*]] = load ptr, ptr [[A_ADDR]], align 8
125+
// CHECK-NEXT: [[TMP4:%.*]] = load ptr, ptr [[B_ADDR]], align 8
126+
// CHECK-NEXT: [[TMP5:%.*]] = load i64, ptr [[C_ADDR]], align 8
127+
// CHECK-NEXT: [[CALL:%.*]] = call ptr [[TMP2]](ptr noundef [[TMP3]], ptr noundef [[TMP4]], i64 noundef [[TMP5]])
128+
// CHECK-NEXT: ret void
129+
//
130+
void bar_alt(void *a, const void *b, size_t c) {
131+
void *(*cpy)(void *, const void *, size_t) = c > 10 ? memmove : foo_alt;
132+
cpy(a, b, c);
133+
}

clang/test/CodeGen/pr9614.c

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -32,7 +32,7 @@ void f(void) {
3232

3333
// CHECK-LABEL: define{{.*}} void @f()
3434
// CHECK: call void @foo()
35-
// CHECK: call i32 @abs(i32 noundef 0)
35+
// CHECK: call i32 @abs(i32 noundef %0)
3636
// CHECK: call ptr @strrchr(
3737
// CHECK: call void @llvm.prefetch.p0(
3838
// CHECK: call ptr @memchr(

0 commit comments

Comments
 (0)