11 | int idx = blockIdx.x * blockDim.x + threadIdx.x;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:12:18: warning: narrowing conversion from 'unsigned int' to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
12 | int stride = gridDim.x * blockDim.x;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:21:47: warning: 2 adjacent parameters of 'max_pool2d_kernel' of similar type ('int') are easily swapped by mistake [bugprone-easily-swappable-parameters]
21 | int batch_size, int channels, int height, int width,
| ^~~~~~~~~~
22 | int pool_height, int pool_width, int stride
| ~~~~~~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:21:51: note: the first parameter in the range is 'width'
21 | int batch_size, int channels, int height, int width,
| ^~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:22:9: note: the last parameter in the range is 'pool_height'
22 | int pool_height, int pool_width, int stride
| ^~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:27:15: warning: narrowing conversion from 'unsigned int' to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
27 | int idx = blockIdx.x * blockDim.x + threadIdx.x;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:28:26: warning: narrowing conversion from 'unsigned int' to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
28 | int stride_threads = blockDim.x * gridDim.x;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:53:5: warning: 2 adjacent parameters of 'linear_kernel' of similar type ('const float *__restrict') are easily swapped by mistake [bugprone-easily-swappable-parameters]
53 | const float* __restrict__ weight,
| ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
54 | const float* __restrict__ bias,
| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:53:31: note: the first parameter in the range is 'weight'
53 | const float* __restrict__ weight,
| ^~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:54:31: note: the last parameter in the range is 'bias'
54 | const float* __restrict__ bias,
| ^~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:56:5: warning: 2 adjacent parameters of 'linear_kernel' of similar type ('int') are easily swapped by mistake [bugprone-easily-swappable-parameters]
56 | int in_features, int out_features
| ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:56:9: note: the first parameter in the range is 'in_features'
56 | int in_features, int out_features
| ^~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:56:26: note: the last parameter in the range is 'out_features'
56 | int in_features, int out_features
| ^~~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:58:15: warning: narrowing conversion from 'unsigned int' to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
58 | int idx = blockIdx.x * blockDim.x + threadIdx.x;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:59:18: warning: narrowing conversion from 'unsigned int' to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
59 | int stride = blockDim.x * gridDim.x;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:93:28: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
93 | const int num_blocks = (x.numel() + block_size - 1) / block_size;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:97:70: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
97 | relu_kernel<<<num_blocks, block_size>>>(conv1.data_ptr<float>(), conv1.numel());
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:102:70: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
102 | relu_kernel<<<num_blocks, block_size>>>(conv2.data_ptr<float>(), conv2.numel());
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:110:68: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
110 | relu_kernel<<<num_blocks, block_size>>>(fc1.data_ptr<float>(), fc1.numel());
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250203_optimize_b10_s4_e0_sweep/level_3/task_4/b10_s2_balanced_workload_distribution/base/base.cu:114:68: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
114 | relu_kernel<<<num_blocks, block_size>>>(fc2.data_ptr<float>(), fc2.numel());
| ^