@@ -230,7 +230,7 @@ typedef float fp32;
230
230
int x) { \
231
231
struct out_##pixelf_size res = \
232
232
__nvvm_suld_1d_v4i##pixelf_size##_##cuda_address_mode##_s( \
233
- image, x * sizeof(struct out_## pixelf_size)); \
233
+ image, x * pixelf_size * 4); \
234
234
return out_pixelf##pixelf_size(res); \
235
235
}
236
236
@@ -239,7 +239,7 @@ typedef float fp32;
239
239
long image, int x, int y) { \
240
240
struct out_##pixelf_size res = \
241
241
__nvvm_suld_2d_v4i##pixelf_size##_##cuda_address_mode##_s( \
242
- image, x * sizeof(struct out_## pixelf_size) , y); \
242
+ image, x * pixelf_size * 4 , y); \
243
243
return out_pixelf##pixelf_size(res); \
244
244
}
245
245
@@ -248,7 +248,7 @@ typedef float fp32;
248
248
long image, int x, int y, int z) { \
249
249
struct out_##pixelf_size res = \
250
250
__nvvm_suld_3d_v4i##pixelf_size##_##cuda_address_mode##_s( \
251
- image, x * sizeof(struct out_## pixelf_size) , y, z); \
251
+ image, x * pixelf_size * 4 , y, z); \
252
252
return out_pixelf##pixelf_size(res); \
253
253
}
254
254
0 commit comments