File tree Expand file tree Collapse file tree 4 files changed +4
-5
lines changed Expand file tree Collapse file tree 4 files changed +4
-5
lines changed Original file line number Diff line number Diff line change @@ -136,9 +136,9 @@ void print_header() {
136
136
void Benchmark::run_benchmarks () {
137
137
uint64_t id = gpu::get_thread_id ();
138
138
139
- if (id == 0 ) {
139
+ if (id == 0 )
140
140
print_header ();
141
- }
141
+
142
142
gpu::sync_threads ();
143
143
144
144
for (Benchmark *b : benchmarks) {
Original file line number Diff line number Diff line change @@ -27,6 +27,7 @@ add_benchmark(
27
27
COMPILE_OPTIONS
28
28
${nvptx_math_found}
29
29
${nvptx_bitcode_link_flags}
30
+ -save-temps
30
31
LOADER_ARGS
31
32
--threads 64
32
33
)
Original file line number Diff line number Diff line change @@ -17,8 +17,6 @@ uint64_t get_bits(double x) {
17
17
return LIBC_NAMESPACE::cpp::bit_cast<uint64_t >(x);
18
18
}
19
19
20
- constexpr int RANDOM_INPUT_SIZE = 256 ;
21
-
22
20
// BENCHMARK() expects a function with no parameters that returns a
23
21
// uint64_t representing the latency. Defining each benchmark using macro that
24
22
// expands to a lambda to allow us to switch the implementation of `sin()` to
Original file line number Diff line number Diff line change @@ -230,7 +230,7 @@ endfunction()
230
230
function (_get_hermetic_test_compile_options output_var flags )
231
231
_get_compile_options_from_flags (compile_flags ${flags} )
232
232
list (APPEND compile_options ${LIBC_COMPILE_OPTIONS_DEFAULT} ${compile_flags}
233
- ${flags} -fpie -ffreestanding -fno-exceptions -fno-rtti )
233
+ ${flags} -fpie -ffreestanding -fno-exceptions -fno-rtti -save-temps )
234
234
235
235
# The GPU build requires overriding the default CMake triple and architecture.
236
236
if (LIBC_TARGET_ARCHITECTURE_IS_AMDGPU )
You can’t perform that action at this time.
0 commit comments