Skip to content

Commit 52c36ba

Browse files
committed
src: gpu: intel: fix implicit conversion warnings
1 parent 4929363 commit 52c36ba

3 files changed

Lines changed: 15 additions & 15 deletions

File tree

src/gpu/intel/dynamic_scale.cl

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -46,7 +46,7 @@ __kernel void dynamic_scale_dst(__global float *restrict src,
4646
long c_stride_n) {
4747
long m = get_global_id(0);
4848
long n = get_global_id(1);
49-
int mb = get_global_id(2);
49+
long mb = get_global_id(2);
5050
// decompose mb into batch dimensions (d0..d3)
5151
long d3 = mb / D0 / D1 / D2;
5252
long d2 = (mb / D0 / D1) % D2;

src/gpu/intel/graph/gen_index.cl

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -16,8 +16,8 @@
1616

1717
__kernel void gen_index(__global int *dst, int axis) {
1818
long id = get_global_id(0);
19-
long result, offset = 0;
20-
long idx;
19+
int result, offset = 0;
20+
int idx;
2121

2222
idx = id % D0;
2323
id = id / D0;

src/gpu/intel/zeropad/simple.cl

Lines changed: 12 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -21,10 +21,10 @@
2121
static inline void typed_simple_zero_pad(__global void *a, ulong type_size,
2222
ulong step_nelems, ulong nelems_block, ulong step_block, ulong nsteps,
2323
ulong step_size, zero_pad_mask_t step_bitmask, ulong mode) {
24-
const int i0 = get_global_id(0);
25-
const int istep = get_global_id(1) * step_block;
26-
const int iblock = get_global_id(2);
27-
int offset = iblock * step_size + (step_size - nsteps * step_nelems)
24+
const ulong i0 = get_global_id(0);
25+
const ulong istep = get_global_id(1) * step_block;
26+
const ulong iblock = get_global_id(2);
27+
ulong offset = iblock * step_size + (step_size - nsteps * step_nelems)
2828
+ istep * step_nelems;
2929

3030
const int step = ZERO_PAD_MASK_DT_BITS;
@@ -46,7 +46,7 @@ static inline void typed_simple_zero_pad(__global void *a, ulong type_size,
4646

4747
for (int k = 0; k < step_block; k++) {
4848
__attribute__((opencl_unroll_hint)) // attr:no-format
49-
for (int i = i0; i < step_nelems; i += nelems_block) {
49+
for (ulong i = i0; i < step_nelems; i += nelems_block) {
5050
if (step_bitmask.mask[i / step] & (1 << (i % step))) {
5151
switch (type_size) {
5252
case 8: a8[offset + i] = 0; break;
@@ -137,16 +137,16 @@ simple_zero_pad_subg_16(__global char *a, const uint type_size,
137137
const ulong d1_stride, const ulong d2_stride, const ulong d3_stride,
138138
const unsigned d0_size, const unsigned d1_size, const unsigned d2_size,
139139
const unsigned d3_size, const uint b_multiplier) {
140-
const unsigned a_block_id = get_global_id(0) / 16;
141-
const unsigned b_block_id = get_global_id(1);
142-
unsigned mixed_dims = get_global_id(2);
140+
const ulong a_block_id = get_global_id(0) / 16;
141+
const ulong b_block_id = get_global_id(1);
142+
ulong mixed_dims = get_global_id(2);
143143

144-
const unsigned d3_dim = mixed_dims % d3_size;
144+
const ulong d3_dim = mixed_dims % d3_size;
145145
mixed_dims /= d3_size;
146-
const unsigned d2_dim = mixed_dims % d2_size;
146+
const ulong d2_dim = mixed_dims % d2_size;
147147
mixed_dims /= d2_size;
148-
const unsigned d1_dim = mixed_dims % d1_size;
149-
const unsigned d0_dim = mixed_dims / d1_size;
148+
const ulong d1_dim = mixed_dims % d1_size;
149+
const ulong d0_dim = mixed_dims / d1_size;
150150

151151
__global char *p = a + base_offset;
152152
p += a_block_id * b_block_size;

0 commit comments

Comments
 (0)