10 | const float* __restrict__ weight,
| ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
11 | const float* __restrict__ bias,
| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:10:31: note: the first parameter in the range is 'weight'
10 | const float* __restrict__ weight,
| ^~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:11:31: note: the last parameter in the range is 'bias'
11 | const float* __restrict__ bias,
| ^~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:13:5: warning: 2 adjacent parameters of 'convTranspose2dCoalescedKernel' of similar type ('int') are easily swapped by mistake [bugprone-easily-swappable-parameters]
13 | int batch,
| ^~~~~~~~~~
14 | int in_channels,
| ~~~~~~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:13:9: note: the first parameter in the range is 'batch'
13 | int batch,
| ^~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:14:9: note: the last parameter in the range is 'in_channels'
14 | int in_channels,
| ^~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:15:5: warning: 2 adjacent parameters of 'convTranspose2dCoalescedKernel' of similar type ('int') are easily swapped by mistake [bugprone-easily-swappable-parameters]
15 | int out_channels,
| ^~~~~~~~~~~~~~~~~
16 | int height_in,
| ~~~~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:15:9: note: the first parameter in the range is 'out_channels'
15 | int out_channels,
| ^~~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:16:9: note: the last parameter in the range is 'height_in'
16 | int height_in,
| ^~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:17:5: warning: 2 adjacent parameters of 'convTranspose2dCoalescedKernel' of similar type ('int') are easily swapped by mistake [bugprone-easily-swappable-parameters]
17 | int width_in,
| ^~~~~~~~~~~~~
18 | int kernel_size,
| ~~~~~~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:17:9: note: the first parameter in the range is 'width_in'
17 | int width_in,
| ^~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:18:9: note: the last parameter in the range is 'kernel_size'
18 | int kernel_size,
| ^~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:19:5: warning: 3 adjacent parameters of 'convTranspose2dCoalescedKernel' of similar type ('int') are easily swapped by mistake [bugprone-easily-swappable-parameters]
19 | int stride,
| ^~~~~~~~~~~
20 | int padding,
| ~~~~~~~~~~~~
21 | int height_out,
| ~~~~~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:19:9: note: the first parameter in the range is 'stride'
19 | int stride,
| ^~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:21:9: note: the last parameter in the range is 'height_out'
21 | int height_out,
| ^~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:22:5: warning: 2 adjacent parameters of 'convTranspose2dCoalescedKernel' of similar type ('int') are easily swapped by mistake [bugprone-easily-swappable-parameters]
22 | int width_out,
| ^~~~~~~~~~~~~~
23 | int groups,
| ~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:22:9: note: the first parameter in the range is 'width_out'
22 | int width_out,
| ^~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:23:9: note: the last parameter in the range is 'groups'
23 | int groups,
| ^~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:26:15: warning: narrowing conversion from 'unsigned int' to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
26 | int idx = blockIdx.x * blockDim.x + threadIdx.x;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:85:19: warning: the parameter 'x' is copied for each invocation but only used as a const reference; consider making it a const reference [performance-unnecessary-value-param]
85 | torch::Tensor x,
| ^
| const &
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:86:19: warning: the parameter 'weight' is copied for each invocation but only used as a const reference; consider making it a const reference [performance-unnecessary-value-param]
86 | torch::Tensor weight,
| ^
| const &
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:90:5: warning: 2 adjacent parameters of 'conv_transpose2d_forward' of similar type ('int64_t') are easily swapped by mistake [bugprone-easily-swappable-parameters]
90 | int64_t output_padding,
| ^~~~~~~~~~~~~~~~~~~~~~~
91 | int64_t groups
| ~~~~~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:90:13: note: the first parameter in the range is 'output_padding'
90 | int64_t output_padding,
| ^~~~~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:91:13: note: the last parameter in the range is 'groups'
91 | int64_t groups
| ^~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:96:17: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
96 | int batch = x.size(0);
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:97:23: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
97 | int in_channels = x.size(1);
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:98:21: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
98 | int height_in = x.size(2);
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:99:20: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
99 | int width_in = x.size(3);
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:100:23: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
100 | int kernel_size = weight.size(2);
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:101:24: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
101 | int out_channels = weight.size(1) * groups;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:103:22: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
103 | int height_out = (height_in - 1) * stride - 2 * padding + kernel_size + output_padding;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:104:21: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
104 | int width_out = (width_in - 1) * stride - 2 * padding + kernel_size + output_padding;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:119:22: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
119 | kernel_size, stride, padding,
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:119:30: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
119 | kernel_size, stride, padding,
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250211_optimize_b5_s4_e1_v2/level_1/task_57/b4_s3_conv_transposed2d_coalesced/base/base.cu:121:9: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
121 | groups, bias.has_value()
| ^