15 | const float* __restrict__ anchor,
| ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
16 | const float* __restrict__ positive,
| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
17 | const float* __restrict__ negative,
| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:15:31: note: the first parameter in the range is 'anchor'
15 | const float* __restrict__ anchor,
| ^~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:17:31: note: the last parameter in the range is 'negative'
17 | const float* __restrict__ negative,
| ^~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:19:5: warning: 3 adjacent parameters of 'triplet_margin_loss_kernel_optimized' of convertible types are easily swapped by mistake [bugprone-easily-swappable-parameters]
19 | const float margin,
| ^~~~~~~~~~~~~~~~~~~
20 | const int batch_size,
| ~~~~~~~~~~~~~~~~~~~~~
21 | const int feat_size) {
| ~~~~~~~~~~~~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:19:17: note: the first parameter in the range is 'margin'
19 | const float margin,
| ^~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:21:15: note: the last parameter in the range is 'feat_size'
21 | const int feat_size) {
| ^~~~~~~~~
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:20:5: note: 'const float' and 'const int' may be implicitly converted: 'const float' (as 'float') -> 'const int' (as 'int'), 'const int' (as 'int') -> 'const float' (as 'float')
20 | const int batch_size,
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:23:27: warning: narrowing conversion from 'unsigned int' to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
23 | const int batch_idx = blockIdx.x;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:31:25: warning: narrowing conversion from 'unsigned int' to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
31 | const int lane_id = threadIdx.x % 32;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:32:25: warning: narrowing conversion from 'unsigned int' to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
32 | const int warp_id = threadIdx.x / 32;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:33:27: warning: narrowing conversion from 'unsigned int' to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
33 | const int num_warps = blockDim.x / 32;
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:47:18: warning: narrowing conversion from 'unsigned int' to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
47 | for (int i = threadIdx.x; i < vec_elements; i += blockDim.x) {
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:47:54: warning: narrowing conversion from 'unsigned int' to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
47 | for (int i = threadIdx.x; i < vec_elements; i += blockDim.x) {
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:79:18: warning: narrowing conversion from 'unsigned int' to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
79 | for (int i = vec_elements * 4 + threadIdx.x; i < feat_size; i += blockDim.x) {
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:79:70: warning: narrowing conversion from 'unsigned int' to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
79 | for (int i = vec_elements * 4 + threadIdx.x; i < feat_size; i += blockDim.x) {
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:118:19: warning: the parameter 'anchor' is copied for each invocation but only used as a const reference; consider making it a const reference [performance-unnecessary-value-param]
118 | torch::Tensor anchor,
| ^
| const &
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:119:19: warning: the parameter 'positive' is copied for each invocation but only used as a const reference; consider making it a const reference [performance-unnecessary-value-param]
119 | torch::Tensor positive,
| ^
| const &
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:120:19: warning: the parameter 'negative' is copied for each invocation but only used as a const reference; consider making it a const reference [performance-unnecessary-value-param]
120 | torch::Tensor negative,
| ^
| const &
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:127:28: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
127 | const int batch_size = anchor.size(0);
| ^
/home/robert_sakana_ai/llm_cuda/experiments/20250208_optimize_b5_s4_e1_sweep/level_1/task_99/b3_s2_warp_optimized_tripletloss/base/base.cu:128:27: warning: narrowing conversion from 'int64_t' (aka 'long') to signed type 'int' is implementation-defined [bugprone-narrowing-conversions]
128 | const int feat_size = anchor.size(1);
| ^