|
4 | 4 | from cuda.core.experimental._module import ObjectCode
|
5 | 5 |
|
6 | 6 | ARCH = "sm_80" # use sm_80 for testing the oop nvJitLink wrapper
|
7 |
| -empty_entrypoint_kernel = "__global__ void A() {}" |
8 |
| -empty_kernel = "__device__ void B() {}" |
| 7 | +empty_kernel = "__device__ void A() {}" |
| 8 | +basic_kernel = "__device__ int B() { return 0; }" |
9 | 9 | addition_kernel = "__device__ int C(int a, int b) { return a + b; }"
|
10 | 10 |
|
11 | 11 |
|
12 | 12 | @pytest.fixture(scope="function")
|
13 | 13 | def compile_ptx_functions(init_cuda):
|
14 |
| - object_code_a_ptx = Program(empty_entrypoint_kernel, "c++").compile("ptx") |
15 |
| - object_code_b_ptx = Program(empty_kernel, "c++").compile("ptx") |
| 14 | + object_code_a_ptx = Program(empty_kernel, "c++").compile("ptx") |
| 15 | + object_code_b_ptx = Program(basic_kernel, "c++").compile("ptx") |
16 | 16 | object_code_c_ptx = Program(addition_kernel, "c++").compile("ptx")
|
17 | 17 |
|
18 | 18 | return object_code_a_ptx, object_code_b_ptx, object_code_c_ptx
|
19 | 19 |
|
20 | 20 |
|
21 | 21 | @pytest.fixture(scope="function")
|
22 | 22 | def compile_ltoir_functions(init_cuda):
|
23 |
| - object_code_a_ltoir = Program(empty_entrypoint_kernel, "c++").compile("ltoir", options=("-dlto",)) |
24 |
| - object_code_b_ltoir = Program(empty_kernel, "c++").compile("ltoir", options=("-dlto",)) |
| 23 | + object_code_a_ltoir = Program(empty_kernel, "c++").compile("ltoir", options=("-dlto",)) |
| 24 | + object_code_b_ltoir = Program(basic_kernel, "c++").compile("ltoir", options=("-dlto",)) |
25 | 25 | object_code_c_ltoir = Program(addition_kernel, "c++").compile("ltoir", options=("-dlto",))
|
26 | 26 |
|
27 | 27 | return object_code_a_ltoir, object_code_b_ltoir, object_code_c_ltoir
|
|
0 commit comments