-
Notifications
You must be signed in to change notification settings - Fork 14.3k
[transforms] Inline simple variadic functions #81058
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Closed
JonChesterfield
wants to merge
1
commit into
llvm:main
from
JonChesterfield:jc_varargs_inliner_component
Closed
Changes from all commits
Commits
File filter
Filter by extension
Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
There are no files selected for viewing
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,273 @@ | ||
// NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py | ||
|
||
// REQUIRES: x86-registered-target | ||
// RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu -target-cpu x86-64-v4 -std=c23 -O1 -ffreestanding -emit-llvm -o - %s | FileCheck %s | ||
|
||
// This test sanity checks calling a variadic function with the expansion transform disabled. | ||
// The IR test cases {arch}/expand-variadic-call-*.ll correspond to IR generated from this test case. | ||
|
||
typedef __builtin_va_list va_list; | ||
#define va_copy(dest, src) __builtin_va_copy(dest, src) | ||
#define va_start(ap, ...) __builtin_va_start(ap, 0) | ||
#define va_end(ap) __builtin_va_end(ap) | ||
#define va_arg(ap, type) __builtin_va_arg(ap, type) | ||
|
||
// 32 bit x86 alignment uses getTypeStackAlign for special cases | ||
// Whitebox testing. | ||
// Needs a type >= 16 which is either a simd or a struct containing a simd | ||
// darwinvectorabi should force 4 bytes | ||
// linux vectors with align 16/32/64 return that alignment | ||
|
||
|
||
void wrapped(va_list); | ||
|
||
// CHECK-LABEL: @codegen_for_copy( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: [[CP:%.*]] = alloca [1 x %struct.__va_list_tag], align 16 | ||
// CHECK-NEXT: call void @llvm.lifetime.start.p0(i64 24, ptr nonnull [[CP]]) #[[ATTR7:[0-9]+]] | ||
// CHECK-NEXT: call void @llvm.va_copy(ptr nonnull [[CP]], ptr [[X:%.*]]) | ||
// CHECK-NEXT: call void @wrapped(ptr noundef nonnull [[CP]]) #[[ATTR8:[0-9]+]] | ||
// CHECK-NEXT: call void @llvm.va_end(ptr [[CP]]) | ||
// CHECK-NEXT: call void @llvm.lifetime.end.p0(i64 24, ptr nonnull [[CP]]) #[[ATTR7]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void codegen_for_copy(va_list x) | ||
{ | ||
va_list cp; | ||
va_copy(cp, x); | ||
wrapped(cp); | ||
va_end(cp); | ||
} | ||
|
||
|
||
// CHECK-LABEL: @vararg( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: [[VA:%.*]] = alloca [1 x %struct.__va_list_tag], align 16 | ||
// CHECK-NEXT: call void @llvm.lifetime.start.p0(i64 24, ptr nonnull [[VA]]) #[[ATTR7]] | ||
// CHECK-NEXT: call void @llvm.va_start(ptr nonnull [[VA]]) | ||
// CHECK-NEXT: call void @wrapped(ptr noundef nonnull [[VA]]) #[[ATTR8]] | ||
// CHECK-NEXT: call void @llvm.va_end(ptr [[VA]]) | ||
// CHECK-NEXT: call void @llvm.lifetime.end.p0(i64 24, ptr nonnull [[VA]]) #[[ATTR7]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void vararg(...) | ||
{ | ||
va_list va; | ||
__builtin_va_start(va, 0); | ||
wrapped(va); | ||
va_end(va); | ||
} | ||
|
||
// vectors with alignment 16/32/64 are natively aligned on linux x86 | ||
// v32f32 would be a m1024 type, larger than x64 defines at time of writing | ||
typedef int i32; | ||
typedef float v4f32 __attribute__((__vector_size__(16), __aligned__(16))); | ||
typedef float v8f32 __attribute__((__vector_size__(32), __aligned__(32))); | ||
typedef float v16f32 __attribute__((__vector_size__(64), __aligned__(64))); | ||
typedef float v32f32 __attribute__((__vector_size__(128), __aligned__(128))); | ||
|
||
|
||
// Pass a single value to wrapped() via vararg(...) | ||
// CHECK-LABEL: @single_i32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(i32 noundef [[X:%.*]]) #[[ATTR9:[0-9]+]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void single_i32(i32 x) | ||
{ | ||
vararg(x); | ||
} | ||
|
||
// CHECK-LABEL: @single_double( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(double noundef [[X:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void single_double(double x) | ||
{ | ||
vararg(x); | ||
} | ||
|
||
// CHECK-LABEL: @single_v4f32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(<4 x float> noundef [[X:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void single_v4f32(v4f32 x) | ||
{ | ||
vararg(x); | ||
} | ||
|
||
// CHECK-LABEL: @single_v8f32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(<8 x float> noundef [[X:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void single_v8f32(v8f32 x) | ||
{ | ||
vararg(x); | ||
} | ||
|
||
// CHECK-LABEL: @single_v16f32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(<16 x float> noundef [[X:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void single_v16f32(v16f32 x) | ||
{ | ||
vararg(x); | ||
} | ||
|
||
// CHECK-LABEL: @single_v32f32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: [[INDIRECT_ARG_TEMP:%.*]] = alloca <32 x float>, align 128 | ||
// CHECK-NEXT: [[X:%.*]] = load <32 x float>, ptr [[TMP0:%.*]], align 128, !tbaa [[TBAA2:![0-9]+]] | ||
// CHECK-NEXT: store <32 x float> [[X]], ptr [[INDIRECT_ARG_TEMP]], align 128, !tbaa [[TBAA2]] | ||
// CHECK-NEXT: tail call void (...) @vararg(ptr noundef nonnull byval(<32 x float>) align 128 [[INDIRECT_ARG_TEMP]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void single_v32f32(v32f32 x) | ||
{ | ||
vararg(x); | ||
} | ||
|
||
|
||
|
||
// CHECK-LABEL: @i32_double( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(i32 noundef [[X:%.*]], double noundef [[Y:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void i32_double(i32 x, double y) | ||
{ | ||
vararg(x, y); | ||
} | ||
|
||
// CHECK-LABEL: @double_i32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(double noundef [[X:%.*]], i32 noundef [[Y:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void double_i32(double x, i32 y) | ||
{ | ||
vararg(x, y); | ||
} | ||
|
||
|
||
// A struct used by libc variadic tests | ||
|
||
typedef struct { | ||
char c; | ||
short s; | ||
int i; | ||
long l; | ||
float f; | ||
double d; | ||
} libcS; | ||
|
||
// CHECK-LABEL: @i32_libcS( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(i32 noundef [[X:%.*]], ptr noundef nonnull byval([[STRUCT_LIBCS:%.*]]) align 8 [[Y:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void i32_libcS(i32 x, libcS y) | ||
{ | ||
vararg(x, y); | ||
} | ||
|
||
// CHECK-LABEL: @libcS_i32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(ptr noundef nonnull byval([[STRUCT_LIBCS:%.*]]) align 8 [[X:%.*]], i32 noundef [[Y:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void libcS_i32(libcS x, i32 y) | ||
{ | ||
vararg(x, y); | ||
} | ||
|
||
|
||
// CHECK-LABEL: @i32_v4f32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(i32 noundef [[X:%.*]], <4 x float> noundef [[Y:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void i32_v4f32(i32 x, v4f32 y) | ||
{ | ||
vararg(x, y); | ||
} | ||
|
||
// CHECK-LABEL: @v4f32_i32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(<4 x float> noundef [[X:%.*]], i32 noundef [[Y:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void v4f32_i32(v4f32 x, i32 y) | ||
{ | ||
vararg(x, y); | ||
} | ||
|
||
// CHECK-LABEL: @i32_v8f32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(i32 noundef [[X:%.*]], <8 x float> noundef [[Y:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void i32_v8f32(i32 x, v8f32 y) | ||
{ | ||
vararg(x, y); | ||
} | ||
|
||
// CHECK-LABEL: @v8f32_i32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(<8 x float> noundef [[X:%.*]], i32 noundef [[Y:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void v8f32_i32(v8f32 x, i32 y) | ||
{ | ||
vararg(x, y); | ||
} | ||
|
||
// CHECK-LABEL: @i32_v16f32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(i32 noundef [[X:%.*]], <16 x float> noundef [[Y:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void i32_v16f32(i32 x, v16f32 y) | ||
{ | ||
vararg(x, y); | ||
} | ||
|
||
// CHECK-LABEL: @v16f32_i32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: tail call void (...) @vararg(<16 x float> noundef [[X:%.*]], i32 noundef [[Y:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void v16f32_i32(v16f32 x, i32 y) | ||
{ | ||
vararg(x, y); | ||
} | ||
|
||
// CHECK-LABEL: @i32_v32f32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: [[INDIRECT_ARG_TEMP:%.*]] = alloca <32 x float>, align 128 | ||
// CHECK-NEXT: [[Y:%.*]] = load <32 x float>, ptr [[TMP0:%.*]], align 128, !tbaa [[TBAA2]] | ||
// CHECK-NEXT: store <32 x float> [[Y]], ptr [[INDIRECT_ARG_TEMP]], align 128, !tbaa [[TBAA2]] | ||
// CHECK-NEXT: tail call void (...) @vararg(i32 noundef [[X:%.*]], ptr noundef nonnull byval(<32 x float>) align 128 [[INDIRECT_ARG_TEMP]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void i32_v32f32(i32 x, v32f32 y) | ||
{ | ||
vararg(x, y); | ||
} | ||
|
||
// CHECK-LABEL: @v32f32_i32( | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: [[INDIRECT_ARG_TEMP:%.*]] = alloca <32 x float>, align 128 | ||
// CHECK-NEXT: [[X:%.*]] = load <32 x float>, ptr [[TMP0:%.*]], align 128, !tbaa [[TBAA2]] | ||
// CHECK-NEXT: store <32 x float> [[X]], ptr [[INDIRECT_ARG_TEMP]], align 128, !tbaa [[TBAA2]] | ||
// CHECK-NEXT: tail call void (...) @vararg(ptr noundef nonnull byval(<32 x float>) align 128 [[INDIRECT_ARG_TEMP]], i32 noundef [[Y:%.*]]) #[[ATTR9]] | ||
// CHECK-NEXT: ret void | ||
// | ||
void v32f32_i32(v32f32 x, i32 y) | ||
{ | ||
vararg(x, y); | ||
} | ||
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,86 @@ | ||
// REQUIRES: x86-registered-target | ||
// RUN: %clang_cc1 -triple i386-unknown-linux-gnu -O1 -emit-llvm -o - %s | opt --passes=expand-variadics -S | FileCheck %s | ||
// RUN: %clang_cc1 -triple=x86_64-linux-gnu -O1 -emit-llvm -o - %s | opt --passes=expand-variadics -S | FileCheck %s | ||
|
||
// neither arm arch is implemented yet, leaving it here as a reminder | ||
// armv6 is a ptr as far as the struct is concerned, but possibly also a [1 x i32] passed by value | ||
// that seems insistent, maybe leave 32 bit arm alone for now | ||
// aarch64 is a struct of five things passed using byval memcpy | ||
|
||
// R-N: %clang_cc1 -triple=armv6-none--eabi -O1 -emit-llvm -o - %s | opt --passes=expand-variadics -S | FileCheck %s | ||
|
||
// R-N: %clang_cc1 -triple=aarch64-none-linux-gnu -O1 -emit-llvm -o - %s | opt --passes=expand-variadics -S | FileCheck %s | ||
|
||
|
||
|
||
// expand-variadics rewrites calls to variadic functions into calls to | ||
// equivalent functions that take a va_list argument. A property of the | ||
// implementation is that said "equivalent function" may be a pre-existing one. | ||
// This is equivalent to inlining a sufficiently simple variadic wrapper. | ||
|
||
#include <stdarg.h> | ||
|
||
typedef int FILE; // close enough for this test | ||
|
||
// fprintf is sometimes implemented as a call to vfprintf. That fits the | ||
// pattern the transform pass recognises - given an implementation of fprintf | ||
// in the IR module, calls to it can be rewritten into calls into vfprintf. | ||
|
||
// CHECK-LABEL: define{{.*}} i32 @fprintf( | ||
// CHECK-LABEL: define{{.*}} i32 @call_fprintf( | ||
// CHECK-NOT: @fprintf | ||
// CHECK: @vfprintf | ||
int vfprintf(FILE *restrict f, const char *restrict fmt, va_list ap); | ||
int fprintf(FILE *restrict f, const char *restrict fmt, ...) | ||
{ | ||
int ret; | ||
va_list ap; | ||
va_start(ap, fmt); | ||
ret = vfprintf(f, fmt, ap); | ||
va_end(ap); | ||
return ret; | ||
} | ||
int call_fprintf(FILE *f) | ||
{ | ||
int x = 42; | ||
double y = 3.14; | ||
return fprintf(f, "int %d dbl %g\n", x, y); | ||
} | ||
|
||
// Void return type is also OK | ||
|
||
// CHECK-LABEL: define{{.*}} void @no_result( | ||
// CHECK-LABEL: define{{.*}} void @call_no_result( | ||
// CHECK-NOT: @no_result | ||
// CHECK: @vno_result | ||
void vno_result(const char * fmt, va_list); | ||
void no_result(const char * fmt, ...) | ||
{ | ||
va_list ap; | ||
va_start(ap, fmt); | ||
vno_result(fmt, ap); | ||
va_end(ap); | ||
} | ||
void call_no_result(FILE *f) | ||
{ | ||
int x = 101; | ||
no_result("", x); | ||
} | ||
|
||
// The vaend in the forwarding implementation is optional where it's a no-op | ||
|
||
// CHECK-LABEL: define{{.*}} i32 @no_vaend( | ||
// CHECK-LABEL: define{{.*}} i32 @call_no_vaend( | ||
// CHECK-NOT: @no_vaend | ||
// CHECK: @vno_vaend | ||
int vno_vaend(int x, va_list); | ||
int no_vaend(int x, ...) | ||
{ | ||
va_list ap; | ||
va_start(ap, x); | ||
return vno_vaend(x, ap); | ||
} | ||
int call_no_vaend(int x) | ||
{ | ||
return no_vaend(x, 10, 2.5f); | ||
} |
Oops, something went wrong.
Add this suggestion to a batch that can be applied as a single commit.
This suggestion is invalid because no changes were made to the code.
Suggestions cannot be applied while the pull request is closed.
Suggestions cannot be applied while viewing a subset of changes.
Only one suggestion per line can be applied in a batch.
Add this suggestion to a batch that can be applied as a single commit.
Applying suggestions on deleted lines is not supported.
You must change the existing code in this line in order to create a valid suggestion.
Outdated suggestions cannot be applied.
This suggestion has been applied or marked resolved.
Suggestions cannot be applied from pending reviews.
Suggestions cannot be applied on multi-line comments.
Suggestions cannot be applied while the pull request is queued to merge.
Suggestion cannot be applied right now. Please check back later.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
also get the half and bfloat cases