BEGIN 1782125667.8080735 EXEC /__w/rockrel/rockrel/build/ml-libs/composable_kernel/build /usr/local/therock-tools/bin/cmake -E env --unset=ROCM_PATH --unset=ROCM_DIR --unset=HIP_PATH --unset=HIP_DIR -- /usr/local/therock-tools/bin/cmake --build /__w/rockrel/rockrel/build/ml-libs/composable_kernel/build 73.8 [1/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_f64_kknn_instance.cpp.o 74.6 [2/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_f64_compute_f32_kknn_instance.cpp.o 78.9 [3/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_f64_mnnn_instance.cpp.o 79.9 [4/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_f64_compute_f32_mnnn_instance.cpp.o 80.9 [5/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_f64_compute_f32_mknn_instance.cpp.o 81.0 [6/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_f64_compute_f32_knnn_instance.cpp.o 81.7 [7/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_f64_mknn_instance.cpp.o 86.7 [8/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_f64_knnn_instance.cpp.o 100.7 [9/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_f32_compute_f16_kknn_instance.cpp.o 103.1 [10/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_f32_kknn_instance.cpp.o 106.4 [11/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_f64_compute_f32_kknn_instance.cpp.o 107.2 [12/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_f16_kknn_instance.cpp.o 110.3 [13/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_f16_compute_f32_kknn_instance.cpp.o 110.9 [14/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_f64_mnnn_instance.cpp.o 113.6 [15/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_f64_kknn_instance.cpp.o 115.4 [16/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_f64_compute_f32_mnnn_instance.cpp.o 118.4 [17/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_f64_compute_f32_knnn_instance.cpp.o 119.0 [18/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_f64_mknn_instance.cpp.o 120.4 [19/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_f64_compute_f32_mknn_instance.cpp.o 123.6 [20/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_bf16_kknn_instance.cpp.o 124.6 [21/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_f64_knnn_instance.cpp.o 124.7 [22/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_f32_compute_bf16_kknn_instance.cpp.o 133.8 [23/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_bf16_compute_f32_kknn_instance.cpp.o 143.4 [24/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_f32_compute_f16_mnnn_instance.cpp.o 157.5 [25/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_f32_mnnn_instance.cpp.o 157.6 [26/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_f32_kknn_instance.cpp.o 157.8 [27/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_f32_compute_bf16_mnnn_instance.cpp.o 158.8 [28/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_f16_mnnn_instance.cpp.o 161.9 [29/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_f16_compute_f32_mnnn_instance.cpp.o 162.9 [30/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_f16_compute_f32_kknn_instance.cpp.o 164.7 [31/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_f32_compute_f16_knnn_instance.cpp.o 166.3 [32/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_f32_mknn_instance.cpp.o 166.7 [33/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_f16_compute_f32_knnn_instance.cpp.o 167.1 [34/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_f16_mknn_instance.cpp.o 167.7 [35/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_f32_compute_f16_mknn_instance.cpp.o 167.9 [36/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_f32_knnn_instance.cpp.o 168.4 [37/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_f16_kknn_instance.cpp.o 170.7 [38/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_f16_knnn_instance.cpp.o 171.8 [39/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_f16_compute_f32_mknn_instance.cpp.o 172.5 [40/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_f32_compute_bf16_mknn_instance.cpp.o 173.6 [41/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_f32_compute_bf16_knnn_instance.cpp.o 175.0 [42/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_bf16_compute_f32_knnn_instance.cpp.o 175.6 [43/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_f32_compute_bf16_kknn_instance.cpp.o 177.2 [44/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_bf16_mknn_instance.cpp.o 178.2 [45/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_f32_compute_f16_kknn_instance.cpp.o 178.9 [46/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_bf16_knnn_instance.cpp.o 179.9 [47/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_bf16_mnnn_instance.cpp.o 182.6 [48/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_bf16_compute_f32_mknn_instance.cpp.o 183.6 [49/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/2D/device_contraction_bilinear_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_bf16_compute_f32_mnnn_instance.cpp.o 185.8 [50/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_bf16_kknn_instance.cpp.o 200.7 [51/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_f32_compute_f16_mnnn_instance.cpp.o 204.1 [52/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_f32_mknn_instance.cpp.o 206.2 [53/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_f32_knnn_instance.cpp.o 206.4 [54/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_f16_mnnn_instance.cpp.o 207.5 [55/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_f32_mnnn_instance.cpp.o 208.3 [56/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_kkn_instance.cpp.o 208.8 [57/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_f16_mknn_instance.cpp.o 208.9 [58/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_f16_compute_f32_mnnn_instance.cpp.o 209.5 [59/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_f16_compute_f32_mknn_instance.cpp.o 210.4 [60/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_mnn_instance.cpp.o 210.9 [61/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_f16_knnn_instance.cpp.o 211.5 [62/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_f32_compute_f16_knnn_instance.cpp.o 212.3 [63/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_kkn_instance.cpp.o 212.9 [64/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_f32_compute_f16_mknn_instance.cpp.o 213.7 [65/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_f32_compute_bf16_mknn_instance.cpp.o 213.9 [66/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_f16_compute_f32_knnn_instance.cpp.o 215.1 [67/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_f32_compute_bf16_mnnn_instance.cpp.o 216.0 [68/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_mkn_instance.cpp.o 217.4 [69/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_knn_instance.cpp.o 220.9 [70/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_compute_f32_kkn_instance.cpp.o 223.2 [71/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_f32_compute_bf16_knnn_instance.cpp.o 226.2 [72/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_compute_f32_knn_instance.cpp.o 226.4 [73/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_compute_f16_kkn_instance.cpp.o 228.4 [74/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_bf16_knnn_instance.cpp.o 230.0 [75/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_compute_f32_mkn_instance.cpp.o 230.6 [76/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_knn_instance.cpp.o 234.9 [77/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f64_f64_f64_compute_f32_mnn_instance.cpp.o 246.5 [78/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_compute_bf16_kkn_instance.cpp.o 271.8 [79/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_mkn_instance.cpp.o 273.7 [80/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_mnn_instance.cpp.o 276.0 [81/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_compute_f16_knn_instance.cpp.o 282.0 [82/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_compute_f16_mnn_instance.cpp.o 284.1 [83/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_compute_f16_mkn_instance.cpp.o 286.8 [84/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_bf16_compute_f32_kknn_instance.cpp.o 298.9 [85/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_compute_f32_kkn_instance.cpp.o 299.0 [86/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_kkn_instance.cpp.o 301.2 [87/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_compute_bf16_mnn_instance.cpp.o 302.0 [88/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_kkn_instance.cpp.o 310.5 [89/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_compute_bf16_knn_instance.cpp.o 315.1 [90/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f32_f32_f32_compute_bf16_mkn_instance.cpp.o 338.1 [91/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_compute_f32_kkn_instance.cpp.o 339.1 [92/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_mnn_instance.cpp.o 344.9 [93/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_mnn_instance.cpp.o 350.0 [94/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_kkn_instance.cpp.o 350.2 [95/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_compute_f32_knn_instance.cpp.o 351.6 [96/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_compute_f32_mnn_instance.cpp.o 353.6 [97/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_bf16_mknn_instance.cpp.o 354.5 [98/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_compute_f16_kkn_instance.cpp.o 358.1 [99/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_knn_instance.cpp.o 358.4 [100/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_mkn_instance.cpp.o 359.3 [101/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_bf16_mnnn_instance.cpp.o 360.1 [102/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_knn_instance.cpp.o 361.9 [103/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_compute_f32_mkn_instance.cpp.o 362.1 [104/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_f16_f16_f16_compute_f32_knn_instance.cpp.o 362.3 [105/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_compute_f32_mnn_instance.cpp.o 364.4 [106/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_compute_f32_kkn_instance.cpp.o 366.3 [107/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_kkn_instance.cpp.o 367.4 [108/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_knn_instance.cpp.o 368.4 [109/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_mkn_instance.cpp.o 371.1 [110/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_mnn_instance.cpp.o 371.1 [111/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f64_f64_f64_compute_f32_mkn_instance.cpp.o 380.8 [112/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_mkn_instance.cpp.o 385.1 [113/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_bf16_compute_f32_mnnn_instance.cpp.o 386.2 [114/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_compute_f32_mnn_instance.cpp.o 387.9 [115/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_bf16_compute_f32_mknn_instance.cpp.o 393.6 [116/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_compute_f32_mkn_instance.cpp.o 398.5 [117/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_kkn_instance.cpp.o 399.6 [118/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_bilinear/CMakeFiles/device_contraction_bilinear_instance.dir/6D/device_contraction_bilinear_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_bf16_compute_f32_knnn_instance.cpp.o 400.3 [119/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/2D/device_contraction_scale_m2_n2_k2_xdl_c_shuffle_bf16_bf16_bf16_compute_f32_knn_instance.cpp.o 421.9 [120/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_knn_instance.cpp.o 427.2 [121/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_compute_f16_mnn_instance.cpp.o 439.9 [122/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_compute_bf16_kkn_instance.cpp.o 448.7 [123/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_mkn_instance.cpp.o 451.6 [124/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_compute_f16_knn_instance.cpp.o 451.9 [125/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_compute_f32_kkn_instance.cpp.o 455.7 [126/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_mnn_instance.cpp.o 458.9 [127/1431] Building CXX object library/src/tensor_operation_instance/gpu/elementwise_normalization/CMakeFiles/device_elementwise_normalization_instance.dir/device_elementwise_normalization_f16_instance.cpp.o 463.2 [128/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_compute_f16_mkn_instance.cpp.o 463.7 [129/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv2d_fwd/CMakeFiles/device_conv2d_fwd_instance.dir/device_conv2d_fwd_xdl_nhwc_kyxc_nhwk_f32_instance.cpp.o 465.0 [130/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv1d_bwd_data/CMakeFiles/device_conv1d_bwd_data_instance.dir/device_conv1d_bwd_data_xdl_nwc_kxc_nwk_f32_instance.cpp.o 486.3 [131/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_compute_f32_kkn_instance.cpp.o 487.5 [132/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_kkn_instance.cpp.o 493.5 [133/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv2d_fwd/CMakeFiles/device_conv2d_fwd_instance.dir/device_conv2d_fwd_xdl_nhwc_kyxc_nhwk_f16_instance.cpp.o 497.0 [134/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_knn_instance.cpp.o 497.9 [135/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_compute_bf16_mnn_instance.cpp.o 499.7 [136/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_mnn_instance.cpp.o 501.0 [137/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_compute_f32_mkn_instance.cpp.o 503.5 [138/1431] Building CXX object library/src/tensor_operation_instance/gpu/elementwise/CMakeFiles/device_elementwise_instance.dir/device_normalize_instance.cpp.o 504.3 [139/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_compute_bf16_mkn_instance.cpp.o 506.3 [140/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f32_f32_f32_compute_bf16_knn_instance.cpp.o 522.4 [141/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv2d_fwd/CMakeFiles/device_conv2d_fwd_instance.dir/device_conv2d_fwd_xdl_nhwc_kyxc_nhwk_bf16_instance.cpp.o 523.6 [142/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv1d_bwd_data/CMakeFiles/device_conv1d_bwd_data_instance.dir/device_conv1d_bwd_data_xdl_nwc_kxc_nwk_bf16_instance.cpp.o 529.6 [143/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv1d_bwd_data/CMakeFiles/device_conv1d_bwd_data_instance.dir/device_conv1d_bwd_data_xdl_nwc_kxc_nwk_f16_instance.cpp.o 533.1 [144/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_mkn_instance.cpp.o 534.3 [145/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_compute_f32_knn_instance.cpp.o 547.0 [146/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv2d_fwd/CMakeFiles/device_conv2d_fwd_instance.dir/device_conv2d_fwd_xdl_nhwc_kyxc_nhwk_int8_instance.cpp.o 549.4 [147/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_f16_f16_f16_compute_f32_mnn_instance.cpp.o 558.6 [148/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_mnn_instance.cpp.o 585.5 [149/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_compute_f32_knn_instance.cpp.o 586.7 [150/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_knn_instance.cpp.o 588.3 [151/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv2d_bwd_data/CMakeFiles/device_conv2d_bwd_data_instance.dir/device_conv2d_bwd_data_xdl_nhwc_kyxc_nhwk_f32_instance.cpp.o 589.6 [152/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_mkn_instance.cpp.o 604.0 [153/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_compute_f32_mkn_instance.cpp.o 618.4 [154/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f16_f32_f16_add.cpp.o 627.9 [155/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv1d_bwd_data/CMakeFiles/device_conv1d_bwd_data_instance.dir/device_conv1d_bwd_data_xdl_nwc_kxc_nwk_int8_instance.cpp.o 645.9 [156/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f32_f64_f32_add.cpp.o 647.7 [157/1431] Building CXX object library/src/tensor_operation_instance/gpu/contraction_scale/CMakeFiles/device_contraction_scale_instance.dir/6D/device_contraction_scale_m6_n6_k6_xdl_c_shuffle_bf16_bf16_bf16_compute_f32_mnn_instance.cpp.o 649.0 [158/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv2d_bwd_data/CMakeFiles/device_conv2d_bwd_data_instance.dir/device_conv2d_bwd_data_xdl_nhwc_kyxc_nhwk_f16_instance.cpp.o 651.7 [159/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f32_f32_f32_avg.cpp.o 656.2 [160/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f16_f32_f16_add.cpp.o 658.3 [161/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f32_f32_f32_norm2.cpp.o 663.5 [162/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f32_f32_f32_add.cpp.o 664.6 [163/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f16_f32_f16_avg.cpp.o 666.7 [164/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv2d_bwd_data/CMakeFiles/device_conv2d_bwd_data_instance.dir/device_conv2d_bwd_data_xdl_nhwc_kyxc_nhwk_bf16_instance.cpp.o 666.7 [165/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f16_f32_f16_norm2.cpp.o 668.9 [166/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv3d_bwd_data/CMakeFiles/device_conv3d_bwd_data_instance.dir/device_conv3d_bwd_data_xdl_ndhwc_kzyxc_ndhwk_f16_instance.cpp.o 671.8 [167/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f16_f16_f16_min.cpp.o 674.4 [168/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f16_f32_f16_avg.cpp.o 674.7 [169/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f16_f16_f16_amax.cpp.o 678.8 [170/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f16_f16_f16_max.cpp.o 689.3 [171/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f16_f32_f16_norm2.cpp.o 690.7 [172/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv3d_bwd_data/CMakeFiles/device_conv3d_bwd_data_instance.dir/device_conv3d_bwd_data_xdl_ndhwc_kzyxc_ndhwk_f32_instance.cpp.o 696.2 [173/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv2d_bwd_data/CMakeFiles/device_conv2d_bwd_data_instance.dir/device_conv2d_bwd_data_xdl_nhwc_kyxc_nhwk_int8_instance.cpp.o 698.0 [174/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f32_f64_f32_avg.cpp.o 705.9 [175/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f32_f64_f32_norm2.cpp.o 710.3 [176/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f32_f32_f32_add.cpp.o 710.6 [177/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f32_f32_f32_avg.cpp.o 716.1 [178/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f32_f32_f32_norm2.cpp.o 717.2 [179/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f64_f64_f64_add.cpp.o 724.5 [180/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f64_f64_f64_avg.cpp.o 726.8 [181/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f32_f64_f32_avg.cpp.o 726.8 [182/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_i8_i32_i8_avg.cpp.o 728.4 [183/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f32_f64_f32_norm2.cpp.o 729.1 [184/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f32_f32_f32_amax.cpp.o 729.9 [185/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f32_f32_f32_max.cpp.o 731.1 [186/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f32_f64_f32_add.cpp.o 731.3 [187/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f64_f64_f64_norm2.cpp.o 731.8 [188/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f64_f64_f64_add.cpp.o 740.1 [189/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f64_f64_f64_norm2.cpp.o 741.8 [190/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f64_f64_f64_max.cpp.o 746.0 [191/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f32_f32_f32_min.cpp.o 746.2 [192/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f64_f64_f64_avg.cpp.o 748.1 [193/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_i8_i32_i8_avg.cpp.o 753.8 [194/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv3d_bwd_data/CMakeFiles/device_conv3d_bwd_data_instance.dir/device_conv3d_bwd_data_xdl_ndhwc_kzyxc_ndhwk_bf16_instance.cpp.o 757.8 [195/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_i8_i32_i8_add.cpp.o 758.6 [196/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_i8_i32_i8_add.cpp.o 760.0 [197/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f64_f64_f64_min.cpp.o 764.3 [198/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_i8_i8_i8_amax.cpp.o 766.0 [199/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_f64_f64_f64_amax.cpp.o 767.9 [200/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_b16_f32_b16_avg.cpp.o 768.1 [201/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_b16_f32_b16_avg.cpp.o 768.2 [202/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f16_f16_f16_min.cpp.o 773.4 [203/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_b16_f32_b16_add.cpp.o 774.2 [204/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_b16_f32_b16_amax.cpp.o 775.1 [205/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_i8_i8_i8_min.cpp.o 780.0 [206/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_b16_f32_b16_add.cpp.o 780.8 [207/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_b16_f32_b16_norm2.cpp.o 788.2 [208/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_i8_i8_i8_max.cpp.o 805.7 [209/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_b16_f32_b16_norm2.cpp.o 809.0 [210/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_b16_f32_b16_min.cpp.o 811.4 [211/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f16_f16_f16_max.cpp.o 817.2 [212/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f16_f16_f16_amax.cpp.o 817.6 [213/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_threadwise_b16_f32_b16_max.cpp.o 827.6 [214/1431] Building CXX object library/src/tensor_operation_instance/gpu/softmax/CMakeFiles/device_softmax_instance.dir/device_softmax_f16_f16_instance_rank4_reduce3.cpp.o 838.0 [215/1431] Building CXX object library/src/tensor_operation_instance/gpu/softmax/CMakeFiles/device_softmax_instance.dir/device_softmax_f16_f16_instance_rank3_reduce3.cpp.o 848.6 [216/1431] Building CXX object library/src/tensor_operation_instance/gpu/softmax/CMakeFiles/device_softmax_instance.dir/device_softmax_f16_f16_instance_rank3_reduce2.cpp.o 850.0 [217/1431] Building CXX object library/src/tensor_operation_instance/gpu/softmax/CMakeFiles/device_softmax_instance.dir/device_softmax_f16_f16_instance_rank3_reduce1.cpp.o 855.1 [218/1431] Building CXX object library/src/tensor_operation_instance/gpu/softmax/CMakeFiles/device_softmax_instance.dir/device_softmax_f32_f32_instance_rank3_reduce1.cpp.o 859.1 [219/1431] Building CXX object library/src/tensor_operation_instance/gpu/softmax/CMakeFiles/device_softmax_instance.dir/device_softmax_f16_f16_instance_rank4_reduce2.cpp.o 860.8 [220/1431] Building CXX object library/src/tensor_operation_instance/gpu/softmax/CMakeFiles/device_softmax_instance.dir/device_softmax_f32_f32_instance_rank4_reduce4.cpp.o 861.7 [221/1431] Building CXX object library/src/tensor_operation_instance/gpu/softmax/CMakeFiles/device_softmax_instance.dir/device_softmax_f16_f16_instance_rank4_reduce1.cpp.o 863.1 [222/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f32_f32_f32_max.cpp.o 865.4 [223/1431] Building CXX object library/src/tensor_operation_instance/gpu/softmax/CMakeFiles/device_softmax_instance.dir/device_softmax_f32_f32_instance_rank4_reduce2.cpp.o 867.8 [224/1431] Building CXX object library/src/tensor_operation_instance/gpu/softmax/CMakeFiles/device_softmax_instance.dir/device_softmax_f32_f32_instance_rank3_reduce2.cpp.o 868.9 [225/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_2x_instance.cpp.o 871.1 [226/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f32_f32_f32_min.cpp.o 873.3 [227/1431] Building CXX object library/src/tensor_operation_instance/gpu/softmax/CMakeFiles/device_softmax_instance.dir/device_softmax_f32_f32_instance_rank4_reduce1.cpp.o 874.6 [228/1431] Building CXX object library/src/tensor_operation_instance/gpu/softmax/CMakeFiles/device_softmax_instance.dir/device_softmax_f32_f32_instance_rank4_reduce3.cpp.o 876.6 [229/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv3d_bwd_data/CMakeFiles/device_conv3d_bwd_data_instance.dir/device_conv3d_bwd_data_xdl_ndhwc_kzyxc_ndhwk_int8_instance.cpp.o 877.8 [230/1431] Building CXX object library/src/tensor_operation_instance/gpu/softmax/CMakeFiles/device_softmax_instance.dir/device_softmax_f32_f32_instance_rank3_reduce3.cpp.o 882.2 [231/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv2d_fwd/CMakeFiles/device_conv2d_fwd_instance.dir/device_conv2d_fwd_xdl_c_shuffle_nhwc_kyxc_nhwk_f16_instance.cpp.o 882.6 [232/1431] Building CXX object library/src/tensor_operation_instance/gpu/softmax/CMakeFiles/device_softmax_instance.dir/device_softmax_f16_f16_instance_rank4_reduce4.cpp.o 887.6 [233/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f16_comp_2x_instance.cpp.o 899.7 [234/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f64_f64_f64_min.cpp.o 906.4 [235/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/bf16_bf16_bf16/device_grouped_convnd_bwd_weight_xdl_bf16_bf16_bf16_exp_mem_v2_mnkpadding_instance.cpp.o 909.7 [236/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_multiblock_atomic_add_f64_f64_f64_avg.cpp.o 910.0 [237/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f64_f64_f64_max.cpp.o 912.8 [238/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_b16_f32_b16_max.cpp.o 915.4 [239/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f16_comp_instance.cpp.o 919.5 [240/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_multiblock_atomic_add_f16_f32_f32_add.cpp.o 925.0 [241/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_multiblock_atomic_add_f32_f32_f32_avg.cpp.o 929.9 [242/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_multiblock_atomic_add_f32_f32_f32_add.cpp.o 930.4 [243/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_16x16_instance.cpp.o 930.9 [244/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_multiblock_atomic_add_f16_f32_f32_avg.cpp.o 931.1 [245/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_b16_f32_b16_min.cpp.o 931.2 [246/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_i8_i8_i8_min.cpp.o 932.7 [247/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_multiblock_atomic_add_b16_f32_f32_avg.cpp.o 933.0 [248/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/bf16_bf16_bf16/device_grouped_convnd_bwd_weight_xdl_bf16_bf16_bf16_exp_mem_v2_default_instance.cpp.o 933.9 [249/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/bf16_bf16_bf16/device_grouped_convnd_bwd_weight_xdl_bf16_bf16_bf16_exp_mem_v1_default_instance.cpp.o 934.0 [250/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_multiblock_atomic_add_b16_f32_f32_add.cpp.o 934.6 [251/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/large_tensor/device_grouped_conv2d_fwd_xdl_large_tensor_nhwgc_gkyxc_nhwgk_f32_tf32_instance.cpp.o 939.6 [252/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_bf16_16x16_instance.cpp.o 940.5 [253/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_i8_i8_i8_max.cpp.o 940.8 [254/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_multiblock_atomic_add_f32_f64_f32_avg.cpp.o 941.2 [255/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv2d_fwd_bias_relu/CMakeFiles/device_conv2d_fwd_bias_relu_instance.dir/device_conv2d_fwd_xdl_c_shuffle_bias_relu_nhwc_kyxc_nhwk_f16_instance.cpp.o 942.4 [256/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f32_16x16_instance.cpp.o 942.4 [257/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f64_f64_f64_amax.cpp.o 942.6 [258/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_multiblock_atomic_add_f32_f64_f32_add.cpp.o 944.4 [259/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f16_16x16_instance.cpp.o 945.3 [260/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_multiblock_atomic_add_f64_f64_f64_add.cpp.o 945.9 [261/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/fp16_fp16_fp16/device_grouped_convnd_bwd_weight_xdl_f16_f16_f16_exp_mem_v1_default_instance.cpp.o 948.2 [262/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/large_tensor/device_grouped_conv2d_fwd_xdl_large_tensor_nhwgc_gkyxc_nhwgk_f32_instance.cpp.o 954.9 [263/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/fp16_fp16_fp16/device_grouped_convnd_bwd_weight_xdl_f16_f16_f16_exp_comp_mnkpadding_instance.cpp.o 956.5 [264/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/large_tensor/device_grouped_conv2d_fwd_xdl_large_tensor_nhwgc_gkyxc_nhwgk_bf16_instance.cpp.o 957.9 [265/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/fp16_fp16_fp16/device_grouped_convnd_bwd_weight_xdl_f16_f16_f16_exp_mem_v2_default_instance.cpp.o 963.1 [266/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/large_tensor/device_grouped_conv2d_fwd_xdl_large_tensor_nhwgc_gkyxc_nhwgk_int8_instance.cpp.o 964.5 [267/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/bf16_bf16_bf16/device_grouped_convnd_bwd_weight_xdl_bf16_bf16_bf16_exp_comp_mnkpadding_instance.cpp.o 965.5 [268/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_i8_i8_i8_amax.cpp.o 966.0 [269/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/fp16_fp16_fp16/device_grouped_convnd_bwd_weight_xdl_f16_f16_f16_exp_mem_v2_mnkpadding_instance.cpp.o 966.2 [270/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/bf16_bf16_bf16/device_grouped_convnd_bwd_weight_xdl_bf16_bf16_bf16_exp_comp_default_instance.cpp.o 972.7 [271/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/large_tensor/device_grouped_conv2d_fwd_xdl_large_tensor_nhwgc_gkyxc_nhwgk_f16_instance.cpp.o 973.8 [272/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/fp16_fp16_fp16/device_grouped_convnd_bwd_weight_xdl_f16_f16_f16_exp_comp_default_instance.cpp.o 975.1 [273/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instance.cpp.o 976.3 [274/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/merged_groups/device_grouped_conv2d_fwd_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f32_instance.cpp.o 977.4 [275/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances.cpp.o 978.6 [276/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_20.cpp.o 979.4 [277/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/bf16_bf16_bf16/device_grouped_convnd_bwd_weight_xdl_bf16_bf16_bf16_exp_mem_v1_mnkpadding_instance.cpp.o 979.7 [278/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load_instance.cpp.o 979.8 [279/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_1.cpp.o 980.9 [280/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_2.cpp.o 983.0 [281/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_b16_f32_b16_amax.cpp.o 983.4 [282/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/fp16_fp16_fp16/device_grouped_convnd_bwd_weight_xdl_f16_f16_f16_exp_mem_v1_mnkpadding_instance.cpp.o 983.5 [283/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_0.cpp.o 983.8 [284/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_3.cpp.o 983.8 [285/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/merged_groups/device_grouped_conv2d_fwd_xdl_merged_groups_nhwgc_gkyxc_nhwgk_int8_instance.cpp.o 984.0 [286/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/merged_groups/device_grouped_conv2d_fwd_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f32_tf32_instance.cpp.o 984.7 [287/1431] Building CXX object library/src/tensor_operation_instance/gpu/conv2d_fwd_bias_relu_add/CMakeFiles/device_conv2d_fwd_bias_relu_add_instance.dir/device_conv2d_fwd_xdl_c_shuffle_bias_relu_add_nhwc_kyxc_nhwk_f16_instance.cpp.o 988.6 [288/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_comp_instance.cpp.o 999.4 [289/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_11.cpp.o 1000.0 [290/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f32_comp_instance.cpp.o 1000.2 [291/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_7.cpp.o 1003.2 [292/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_4.cpp.o 1003.4 [293/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_2.cpp.o 1006.1 [294/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_1.cpp.o 1007.9 [295/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_9.cpp.o 1008.8 [296/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_6.cpp.o 1009.5 [297/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_3.cpp.o 1010.2 [298/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_0.cpp.o 1010.5 [299/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_12.cpp.o 1010.9 [300/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_20.cpp.o 1012.7 [301/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_16.cpp.o 1014.2 [302/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances.cpp.o 1015.9 [303/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_5.cpp.o 1017.1 [304/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_13.cpp.o 1017.2 [305/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_14.cpp.o 1018.7 [306/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_8.cpp.o 1020.8 [307/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_15.cpp.o 1023.2 [308/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_17.cpp.o 1025.1 [309/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_18.cpp.o 1025.5 [310/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_19.cpp.o 1025.8 [311/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_inter_instances_shard_10.cpp.o 1031.9 [312/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_11.cpp.o 1032.8 [313/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_8.cpp.o 1034.5 [314/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_14.cpp.o 1035.2 [315/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_16.cpp.o 1035.5 [316/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_12.cpp.o 1036.8 [317/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_6.cpp.o 1040.1 [318/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_5.cpp.o 1040.5 [319/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_9.cpp.o 1041.3 [320/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_7.cpp.o 1046.7 [321/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/merged_groups/device_grouped_conv2d_fwd_xdl_merged_groups_nhwgc_gkyxc_nhwgk_bf16_instance.cpp.o 1047.2 [322/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_17.cpp.o 1047.3 [323/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_15.cpp.o 1048.3 [324/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_13.cpp.o 1049.3 [325/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_4.cpp.o 1053.7 [326/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/merged_groups/device_grouped_conv2d_fwd_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f16_instance.cpp.o 1059.1 [327/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_18.cpp.o 1059.4 [328/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_19.cpp.o 1060.3 [329/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_mem_intra_instances_shard_10.cpp.o 1060.7 [330/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_v3_nhwgc_gkyxc_nhwgk_f16_instance.cpp.o 1061.4 [331/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_v3_nhwgc_gkyxc_nhwgk_bf16_instance.cpp.o 1069.5 [332/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load.cpp.o 1072.3 [333/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/fp16_fp16_fp16/device_grouped_convnd_bwd_weight_xdl_f16_f16_f16_exp_odd_m_instance.cpp.o 1072.9 [334/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_part2_instance.cpp.o 1076.9 [335/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f32_instance.cpp.o 1080.2 [336/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/bf16_bf16_bf16/device_grouped_convnd_bwd_weight_xdl_bf16_bf16_bf16_exp_odd_mn_instance.cpp.o 1084.6 [337/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/fp16_fp16_fp16/device_grouped_convnd_bwd_weight_xdl_f16_f16_f16_exp_odd_mn_instance.cpp.o 1085.4 [338/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instance.cpp.o 1087.3 [339/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load.cpp.o 1087.3 [340/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_nongroup_ported_f16_instance.cpp.o 1089.7 [341/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_nongroup_ported_bf16_instance.cpp.o 1090.0 [342/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/fp16_fp16_fp16/device_grouped_convnd_bwd_weight_xdl_f16_f16_f16_exp_odd_n_instance.cpp.o 1093.9 [343/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f32_comp_large_tensors_instance.cpp.o 1096.2 [344/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_instance.cpp.o 1099.4 [345/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f16_instance.cpp.o 1100.9 [346/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/bf16_bf16_bf16/device_grouped_convnd_bwd_weight_xdl_bf16_bf16_bf16_exp_odd_m_instance.cpp.o 1103.7 [347/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_convnd_bwd_weight/CMakeFiles/device_grouped_convnd_bwd_weight_instance.dir/explicit_xdl/bf16_bf16_bf16/device_grouped_convnd_bwd_weight_xdl_bf16_bf16_bf16_exp_odd_n_instance.cpp.o 1105.4 [348/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_bf16_instance.cpp.o 1126.3 [349/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f16_wavelet_default_instance.cpp.o 1129.9 [350/1431] Building CXX object library/src/tensor_operation_instance/gpu/reduce/CMakeFiles/device_reduce_instance.dir/device_reduce_instance_blockwise_f32_f32_f32_amax.cpp.o 1130.3 [351/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f16_wavelet_pad0_instance.cpp.o 1130.5 [352/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f32_pad0_pipev2_instance.cpp.o 1131.0 [353/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f16_wavelet_4w2_pad0_instance.cpp.o 1133.3 [354/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_bf16_wavelet_pad0_instance.cpp.o 1134.3 [355/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f16_wavelet_4w2_default_instance.cpp.o 1136.2 [356/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_bf16_wavelet_default_instance.cpp.o 1136.5 [357/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_bf16_wavelet_4w2_pad0_instance.cpp.o 1136.8 [358/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f16_comp_large_tensors_instance.cpp.o 1137.1 [359/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f32_default_pipev2_instance.cpp.o 1138.2 [360/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f32_pad0_pipev5_instance.cpp.o 1139.3 [361/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_large_tensors_instance.cpp.o 1139.6 [362/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_bf16_wavelet_4w2_default_instance.cpp.o 1148.4 [363/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instance.cpp.o 1149.7 [364/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f32_default_pipev5_instance.cpp.o 1150.4 [365/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_default_pipev2_instance.cpp.o 1152.6 [366/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_int8_comp_instance.cpp.o 1155.2 [367/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_nhwgc_gkyxc_nhwgk_f16_16_16_instance.cpp.o 1162.4 [368/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_pad0_pipev2_instance.cpp.o 1169.6 [369/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_pad0_pipev5_instance.cpp.o 1175.2 [370/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_nhwgc_gkyxc_nhwgk_bf16_16_16_instance.cpp.o 1186.9 [371/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_2x_instance.cpp.o 1190.9 [372/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_comp_2x_instance.cpp.o 1199.1 [373/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_16_16_instance.cpp.o 1200.7 [374/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_nhwgc_gkyxc_nhwgk_f32_16_16_instance.cpp.o 1209.8 [375/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_default_pipev5_instance.cpp.o 1211.1 [376/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_comp_instance.cpp.o 1226.5 [377/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_optimized_loads_instance.cpp.o 1231.8 [378/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_16x16_instance.cpp.o 1234.2 [379/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_16x16_instance.cpp.o 1238.6 [380/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_bf16_f32_bf16_instance.cpp.o 1245.4 [381/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_nhwgc_gkyxc_nhwgk_f32_optimized_loads_instance.cpp.o 1246.6 [382/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_16x16_instance.cpp.o 1251.5 [383/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_two_stage_xdl_nhwgc_gkyxc_nhwgk_f16_pipev1_part2_instance.cpp.o 1251.8 [384/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_bf16_instance.cpp.o 1258.9 [385/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f16_instance.cpp.o 1262.3 [386/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_two_stage_xdl_nhwgc_gkyxc_nhwgk_bf16_pipev1_part2_instance.cpp.o 1266.1 [387/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_tf32_16x16_instance.cpp.o 1273.9 [388/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/large_tensor/device_grouped_conv2d_fwd_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_fp32_instance.cpp.o 1290.8 [389/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/large_tensor/device_grouped_conv2d_fwd_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_fp32_tf32_instance.cpp.o 1301.9 [390/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_nhwgc_gkyxc_nhwgk_f16_optimized_loads_instance.cpp.o 1302.4 [391/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/large_tensor/device_grouped_conv2d_fwd_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_fp16_instance.cpp.o 1308.0 [392/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_tf32_comp_instance.cpp.o 1308.2 [393/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/large_tensor/device_grouped_conv2d_fwd_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_bf16_instance.cpp.o 1310.5 [394/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_nhwgc_gkyxc_nhwgk_bf16_optimized_loads_instance.cpp.o 1313.6 [395/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instance.cpp.o 1314.7 [396/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f16_pad0_pipev2_instance.cpp.o 1323.1 [397/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_direct_load_instance.cpp.o 1324.2 [398/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instance.cpp.o 1325.8 [399/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_two_stage_xdl_nhwgc_gkyxc_nhwgk_bf16_pipev1_instance.cpp.o 1326.6 [400/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_two_stage_xdl_nhwgc_gkyxc_nhwgk_f16_pipev1_instance.cpp.o 1328.2 [401/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_v3_nhwgc_gkyxc_nhwgk_f32_large_tensors_instance.cpp.o 1331.7 [402/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instance.cpp.o 1331.7 [403/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instance.cpp.o 1335.6 [404/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_comp_instance.cpp.o 1342.7 [405/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instance.cpp.o 1348.1 [406/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_bf16_pad0_pipev2_instance.cpp.o 1348.3 [407/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f32_instance.cpp.o 1359.5 [408/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/merged_groups/device_grouped_conv2d_fwd_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_fp32_instance.cpp.o 1362.2 [409/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/merged_groups/device_grouped_conv2d_fwd_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_fp32_tf32_instance.cpp.o 1390.5 [410/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_comp_instance.cpp.o 1392.1 [411/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_comp_2x_instance.cpp.o 1398.1 [412/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_2x_instance.cpp.o 1408.7 [413/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_bf16_default_pipev2_instance.cpp.o 1408.8 [414/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_16x16_instance.cpp.o 1409.1 [415/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_16x16_instance.cpp.o 1416.3 [416/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f16_default_pipev2_instance.cpp.o 1417.1 [417/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_16x16_instance.cpp.o 1418.7 [418/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/merged_groups/device_grouped_conv2d_fwd_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_bf16_instance.cpp.o 1421.0 [419/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instance.cpp.o 1421.5 [420/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instance.cpp.o 1422.5 [421/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_tf32_16x16_instance.cpp.o 1434.9 [422/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f16_comp_part2_instance.cpp.o 1435.9 [423/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_bf16_pad0_pipev5_instance.cpp.o 1436.5 [424/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f16_pad0_pipev5_instance.cpp.o 1438.1 [425/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instance.cpp.o 1438.3 [426/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instance.cpp.o 1439.4 [427/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_instance.cpp.o 1440.5 [428/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/merged_groups/device_grouped_conv2d_fwd_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_fp16_instance.cpp.o 1456.0 [429/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_tf32_instance.cpp.o 1458.2 [430/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_2x_instances.cpp.o 1461.9 [431/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/large_tensor/device_grouped_conv2d_fwd_bias_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_fp16_instance.cpp.o 1462.7 [432/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/large_tensor/device_grouped_conv2d_fwd_bias_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_fp32_instance.cpp.o 1469.1 [433/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/large_tensor/device_grouped_conv2d_fwd_bias_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_bf16_instance.cpp.o 1469.7 [434/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/large_tensor/device_grouped_conv2d_fwd_bias_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_fp32_tf32_instance.cpp.o 1473.1 [435/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_instance.cpp.o 1479.2 [436/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_part2_instance.cpp.o 1481.8 [437/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instance.cpp.o 1484.0 [438/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f32_default_large_tensors_instance.cpp.o 1498.6 [439/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/merged_groups/device_grouped_conv2d_fwd_bias_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_fp32_tf32_instance.cpp.o 1499.0 [440/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_direct_load_instance.cpp.o 1508.2 [441/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/merged_groups/device_grouped_conv2d_fwd_bias_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_fp32_instance.cpp.o 1514.7 [442/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instances.cpp.o 1520.8 [443/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_comp_instance.cpp.o 1524.3 [444/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instance.cpp.o 1529.2 [445/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_tf32_comp_instance.cpp.o 1536.2 [446/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instance.cpp.o 1536.9 [447/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_2x_instances_shard_0.cpp.o 1541.2 [448/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_v3_nhwgc_gkyxc_nhwgk_f16_large_tensors_instance.cpp.o 1544.1 [449/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_part2_instances.cpp.o 1545.1 [450/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f16_default_pipev5_instance.cpp.o 1548.6 [451/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instances_shard_10.cpp.o 1549.6 [452/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_2x_instances.cpp.o 1553.6 [453/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instances_shard_1.cpp.o 1554.0 [454/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instances_shard_8.cpp.o 1554.3 [455/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instances_shard_9.cpp.o 1558.8 [456/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_instances.cpp.o 1559.0 [457/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instances_shard_2.cpp.o 1564.2 [458/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_bf16_default_pipev5_instance.cpp.o 1567.5 [459/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instance.cpp.o 1571.5 [460/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instances_shard_7.cpp.o 1581.6 [461/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_two_stage_xdl_nhwgc_gkyxc_nhwgk_bf16_pipev5_instance.cpp.o 1584.7 [462/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_v3_nhwgc_gkyxc_nhwgk_bf16_large_tensors_instance.cpp.o 1593.7 [463/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_two_stage_xdl_nhwgc_gkyxc_nhwgk_f16_pipev2_instance.cpp.o 1597.4 [464/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/merged_groups/device_grouped_conv2d_fwd_bias_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_bf16_instance.cpp.o 1599.5 [465/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_part2_instances.cpp.o 1605.2 [466/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_f16_default_large_tensors_instance.cpp.o 1607.1 [467/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/merged_groups/device_grouped_conv2d_fwd_bias_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_fp16_instance.cpp.o 1610.5 [468/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_part2_instances_shard_3.cpp.o 1616.1 [469/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_tf32_instance.cpp.o 1618.7 [470/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_2x_instances_shard_0.cpp.o 1619.3 [471/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_two_stage_xdl_nhwgc_gkyxc_nhwgk_bf16_pipev2_irregular_instance.cpp.o 1619.5 [472/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_instance.cpp.o 1619.5 [473/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_comp_instances.cpp.o 1622.1 [474/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_part2_instances_shard_1.cpp.o 1624.3 [475/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_two_stage_xdl_nhwgc_gkyxc_nhwgk_f16_pipev2_irregular_instance.cpp.o 1634.6 [476/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_comp_instances.cpp.o 1639.1 [477/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_instance.cpp.o 1640.3 [478/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_xdl_nhwgc_gkyxc_nhwgk_bf16_default_large_tensors_instance.cpp.o 1642.2 [479/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_instances_shard_0.cpp.o 1645.3 [480/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_part2_instances_shard_4.cpp.o 1645.5 [481/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_two_stage_xdl_nhwgc_gkyxc_nhwgk_f16_pipev5_instance.cpp.o 1651.1 [482/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_16x16_instances.cpp.o 1651.5 [483/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instances_shard_5.cpp.o 1653.9 [484/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_part2_instances_shard_7.cpp.o 1656.0 [485/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instance.cpp.o 1657.8 [486/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_two_stage_xdl_nhwgc_gkyxc_nhwgk_bf16_pipev2_instance.cpp.o 1661.2 [487/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instances_shard_6.cpp.o 1661.8 [488/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_two_stage_xdl_nhwgc_gkyxc_nhwgk_bf16_large_tensors_instance.cpp.o 1664.7 [489/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_16x16_instances_shard_0.cpp.o 1665.9 [490/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_16x16_instances_shard_1.cpp.o 1666.1 [491/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_16x16_instances_shard_2.cpp.o 1670.9 [492/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_part2_instances_shard_11.cpp.o 1671.2 [493/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_comp_instances_shard_0.cpp.o 1677.2 [494/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_comp_instances_shard_1.cpp.o 1677.4 [495/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_16x16_instances_shard_3.cpp.o 1678.9 [496/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_part2_instances_shard_8.cpp.o 1680.5 [497/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_comp_instances_shard_1.cpp.o 1687.2 [498/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances.cpp.o 1688.0 [499/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_comp_instances_shard_0.cpp.o 1690.0 [500/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_1.cpp.o 1693.7 [501/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_comp_instances_shard_3.cpp.o 1693.9 [502/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_two_stage_xdl_nhwgc_gkyxc_nhwgk_f16_large_tensors_instance.cpp.o 1694.6 [503/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_10.cpp.o 1696.0 [504/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_6.cpp.o 1696.9 [505/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_16x16_instances.cpp.o 1698.5 [506/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_part2_instances_shard_10.cpp.o 1698.9 [507/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_mem_inter_instance.cpp.o 1699.8 [508/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_7.cpp.o 1700.5 [509/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_3.cpp.o 1701.3 [510/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_2.cpp.o 1701.4 [511/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_11.cpp.o 1701.4 [512/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_9.cpp.o 1702.1 [513/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_13.cpp.o 1702.2 [514/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_5.cpp.o 1702.4 [515/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_8.cpp.o 1702.4 [516/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_comp_instances_shard_3.cpp.o 1704.0 [517/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_12.cpp.o 1704.7 [518/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_4.cpp.o 1705.1 [519/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_comp_instances_shard_2.cpp.o 1705.1 [520/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_0.cpp.o 1705.6 [521/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_tf32_mem_intra_instance.cpp.o 1706.1 [522/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_14.cpp.o 1707.5 [523/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_instances_shard_15.cpp.o 1707.8 [524/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_two_stage_xdl_nhwgc_gkyxc_nhwgk_f16_pipev5_irregular_instance.cpp.o 1709.9 [525/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_part2_instances_shard_9.cpp.o 1711.8 [526/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances.cpp.o 1712.9 [527/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_16x16_instances_shard_2.cpp.o 1713.2 [528/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_part2_instance.cpp.o 1713.3 [529/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_16x16_instances_shard_1.cpp.o 1714.7 [530/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_16x16_instances.cpp.o 1715.3 [531/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_16x16_instances_shard_0.cpp.o 1715.9 [532/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_comp_instances_shard_2.cpp.o 1717.8 [533/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_16x16_instances_shard_3.cpp.o 1723.1 [534/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instances_shard_3.cpp.o 1723.3 [535/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_mem_intra_instance.cpp.o 1731.8 [536/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_6.cpp.o 1732.3 [537/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_1.cpp.o 1732.8 [538/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_13.cpp.o 1735.2 [539/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_12.cpp.o 1735.3 [540/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_2.cpp.o 1735.7 [541/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_15.cpp.o 1736.0 [542/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_11.cpp.o 1736.5 [543/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_3.cpp.o 1737.5 [544/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_14.cpp.o 1737.7 [545/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_weight/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_weight_nhwgc_instance.dir/xdl/nhwgc_gkyxc_nhwgk/device_grouped_conv2d_bwd_weight_two_stage_xdl_nhwgc_gkyxc_nhwgk_bf16_pipev5_irregular_instance.cpp.o 1737.7 [546/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_16x16_instances_shard_2.cpp.o 1737.9 [547/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_5.cpp.o 1738.2 [548/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_10.cpp.o 1738.4 [549/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_tf32_mem_inter_instance.cpp.o 1739.0 [550/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_4.cpp.o 1739.2 [551/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_9.cpp.o 1739.7 [552/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_2.cpp.o 1740.0 [553/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_7.cpp.o 1740.0 [554/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_part2_instances_shard_2.cpp.o 1740.0 [555/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_part2_instances_shard_1.cpp.o 1741.2 [556/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_16x16_instances_shard_1.cpp.o 1741.4 [557/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_1.cpp.o 1741.6 [558/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_8.cpp.o 1741.9 [559/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances.cpp.o 1742.6 [560/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_16x16_instances_shard_0.cpp.o 1745.9 [561/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_10.cpp.o 1745.9 [562/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_16x16_instances.cpp.o 1747.7 [563/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_6.cpp.o 1748.0 [564/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_instances_shard_0.cpp.o 1748.5 [565/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_11.cpp.o 1748.9 [566/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_9.cpp.o 1748.9 [567/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_7.cpp.o 1749.3 [568/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_8.cpp.o 1751.0 [569/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_5.cpp.o 1751.4 [570/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_12.cpp.o 1751.8 [571/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_4.cpp.o 1751.8 [572/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances.cpp.o 1752.8 [573/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_3.cpp.o 1754.3 [574/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_14.cpp.o 1754.4 [575/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_part2_instances_shard_2.cpp.o 1755.1 [576/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_bf16_instances.cpp.o 1755.6 [577/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_13.cpp.o 1756.8 [578/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_part2_instances_shard_5.cpp.o 1759.1 [579/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_f16_instances.cpp.o 1759.2 [580/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_mem_inter_instance.cpp.o 1759.6 [581/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_f32_instances.cpp.o 1760.1 [582/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_part2_instances_shard_0.cpp.o 1760.7 [583/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_15.cpp.o 1762.2 [584/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_part2_instances_shard_6.cpp.o 1762.8 [585/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_f32_tf32_instances.cpp.o 1763.4 [586/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_16x16_instances_shard_2.cpp.o 1765.9 [587/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_part2_instances_shard_4.cpp.o 1767.1 [588/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_16x16_instances_shard_1.cpp.o 1768.7 [589/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_6.cpp.o 1769.2 [590/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_16x16_instances_shard_0.cpp.o 1769.5 [591/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_13.cpp.o 1769.8 [592/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_7.cpp.o 1771.3 [593/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_1.cpp.o 1772.0 [594/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_11.cpp.o 1772.8 [595/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_instances_shard_0.cpp.o 1773.7 [596/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instances_shard_1.cpp.o 1773.8 [597/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_9.cpp.o 1773.9 [598/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_10.cpp.o 1774.0 [599/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instances_shard_2.cpp.o 1774.0 [600/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_8.cpp.o 1774.4 [601/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instances.cpp.o 1774.5 [602/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_14.cpp.o 1774.9 [603/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_2.cpp.o 1775.1 [604/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instances_shard_4.cpp.o 1775.5 [605/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instances_shard_3.cpp.o 1775.5 [606/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_12.cpp.o 1776.2 [607/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_15.cpp.o 1776.6 [608/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instance.cpp.o 1776.9 [609/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instances_shard_7.cpp.o 1777.3 [610/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_comp_part2_instance.cpp.o 1777.6 [611/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instances_shard_0.cpp.o 1777.6 [612/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instances_shard_6.cpp.o 1778.7 [613/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instances_shard_5.cpp.o 1779.2 [614/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instances_shard_8.cpp.o 1779.3 [615/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_f32_instances_shard_1.cpp.o 1779.4 [616/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_4.cpp.o 1779.5 [617/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_5.cpp.o 1779.5 [618/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instances_shard_10.cpp.o 1779.6 [619/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instances_shard_9.cpp.o 1779.9 [620/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_bf16_instances_shard_0.cpp.o 1780.5 [621/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_bf16_instances_shard_2.cpp.o 1781.4 [622/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_3.cpp.o 1782.8 [623/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_bf16_instances_shard_1.cpp.o 1782.9 [624/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_1.cpp.o 1782.9 [625/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_f16_instances_shard_2.cpp.o 1783.1 [626/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_0.cpp.o 1783.3 [627/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_direct_load_instances_shard_11.cpp.o 1783.7 [628/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_f32_instances_shard_0.cpp.o 1785.5 [629/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances.cpp.o 1786.5 [630/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_f16_instances_shard_0.cpp.o 1789.9 [631/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_large_tensor_nhwgc_gkyxc_nhwgk_f16_instances_shard_1.cpp.o 1792.9 [632/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_0.cpp.o 1792.9 [633/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances.cpp.o 1799.7 [634/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_1.cpp.o 1800.3 [635/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_2.cpp.o 1800.5 [636/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_0.cpp.o 1802.2 [637/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load_instances_shard_1.cpp.o 1803.1 [638/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_3.cpp.o 1804.1 [639/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instance.cpp.o 1805.4 [640/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load_instances_shard_2.cpp.o 1807.4 [641/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load_instances_shard_0.cpp.o 1808.2 [642/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_2.cpp.o 1808.5 [643/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_12.cpp.o 1809.3 [644/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_instance.cpp.o 1809.7 [645/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_0.cpp.o 1810.7 [646/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load_instances_shard_3.cpp.o 1811.9 [647/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load_instances_shard_5.cpp.o 1811.9 [648/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_11.cpp.o 1812.0 [649/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load_instances_shard_4.cpp.o 1812.3 [650/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_1.cpp.o 1813.0 [651/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_14.cpp.o 1813.2 [652/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_3.cpp.o 1814.2 [653/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load_instances.cpp.o 1814.9 [654/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_13.cpp.o 1816.1 [655/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_10.cpp.o 1816.5 [656/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_14.cpp.o 1816.7 [657/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load_instances_shard_7.cpp.o 1816.7 [658/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load_instances_shard_6.cpp.o 1816.8 [659/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_9.cpp.o 1817.0 [660/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_12.cpp.o 1819.1 [661/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load_instances_shard_8.cpp.o 1819.3 [662/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_8.cpp.o 1819.7 [663/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load_instances_shard_9.cpp.o 1819.9 [664/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_9.cpp.o 1820.0 [665/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_13.cpp.o 1820.1 [666/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_11.cpp.o 1820.6 [667/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_16.cpp.o 1820.6 [668/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_10.cpp.o 1821.1 [669/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load_instances_shard_10.cpp.o 1821.2 [670/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_tf32_mem_inter_instance.cpp.o 1821.7 [671/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_15.cpp.o 1824.0 [672/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_direct_load_instances_shard_11.cpp.o 1824.3 [673/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_tf32_mem_intra_instance.cpp.o 1824.7 [674/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_15.cpp.o 1825.0 [675/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_7.cpp.o 1825.8 [676/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_18.cpp.o 1826.1 [677/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_19.cpp.o 1826.2 [678/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_5.cpp.o 1826.3 [679/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_8.cpp.o 1827.6 [680/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_17.cpp.o 1828.2 [681/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances.cpp.o 1831.3 [682/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_6.cpp.o 1831.5 [683/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_5.cpp.o 1831.7 [684/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_7.cpp.o 1832.0 [685/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_mem_inter_instance.cpp.o 1832.0 [686/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_16.cpp.o 1832.4 [687/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_19.cpp.o 1833.2 [688/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instances_shard_4.cpp.o 1833.6 [689/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_18.cpp.o 1834.0 [690/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp32_mem_intra_instance.cpp.o 1838.9 [691/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_17.cpp.o 1839.0 [692/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_4.cpp.o 1839.1 [693/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instances_shard_6.cpp.o 1839.3 [694/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_2.cpp.o 1839.9 [695/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_3.cpp.o 1840.5 [696/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances.cpp.o 1840.8 [697/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_part2_instances_shard_0.cpp.o 1840.8 [698/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_1.cpp.o 1841.1 [699/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_0.cpp.o 1847.3 [700/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_12.cpp.o 1849.3 [701/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_comp_part2_instances_shard_3.cpp.o 1849.3 [702/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_11.cpp.o 1850.2 [703/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_2.cpp.o 1850.4 [704/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances.cpp.o 1850.7 [705/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_3.cpp.o 1850.8 [706/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_mem_intra_instance.cpp.o 1852.9 [707/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_14.cpp.o 1853.2 [708/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_13.cpp.o 1853.3 [709/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_0.cpp.o 1853.5 [710/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_10.cpp.o 1854.3 [711/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_1.cpp.o 1854.7 [712/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instances_shard_0.cpp.o 1856.3 [713/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_8.cpp.o 1856.6 [714/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_9.cpp.o 1859.3 [715/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_12.cpp.o 1859.5 [716/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_15.cpp.o 1860.0 [717/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_4.cpp.o 1860.2 [718/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_5.cpp.o 1862.1 [719/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_13.cpp.o 1862.5 [720/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_16.cpp.o 1863.1 [721/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_2.cpp.o 1863.5 [722/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_14.cpp.o 1863.6 [723/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/comp/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instances_shard_4.cpp.o 1864.3 [724/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_10.cpp.o 1865.1 [725/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_0.cpp.o 1865.6 [726/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_9.cpp.o 1865.7 [727/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_8.cpp.o 1865.8 [728/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_11.cpp.o 1866.2 [729/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_3.cpp.o 1866.3 [730/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_7.cpp.o 1868.0 [731/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_15.cpp.o 1869.4 [732/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_18.cpp.o 1869.8 [733/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances.cpp.o 1870.4 [734/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_17.cpp.o 1870.6 [735/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_5.cpp.o 1870.8 [736/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_1.cpp.o 1873.8 [737/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_8.cpp.o 1874.0 [738/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_19.cpp.o 1874.6 [739/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_7.cpp.o 1875.1 [740/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_16.cpp.o 1875.6 [741/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_10.cpp.o 1875.7 [742/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_inter_instances_shard_6.cpp.o 1876.0 [743/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_11.cpp.o 1877.1 [744/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_18.cpp.o 1879.4 [745/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_4.cpp.o 1879.8 [746/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_6.cpp.o 1880.7 [747/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_19.cpp.o 1880.8 [748/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f16_mem_intra_instances_shard_17.cpp.o 1881.6 [749/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances.cpp.o 1882.8 [750/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_12.cpp.o 1883.5 [751/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_7.cpp.o 1883.8 [752/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_2.cpp.o 1884.2 [753/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_6.cpp.o 1884.3 [754/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_3.cpp.o 1884.6 [755/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_0.cpp.o 1884.7 [756/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_comp_instance.cpp.o 1886.4 [757/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_9.cpp.o 1888.2 [758/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_1.cpp.o 1889.5 [759/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_13.cpp.o 1892.1 [760/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_2.cpp.o 1892.8 [761/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances.cpp.o 1893.0 [762/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_14.cpp.o 1893.3 [763/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_10.cpp.o 1893.3 [764/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_11.cpp.o 1893.6 [765/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_bf16_instances.cpp.o 1894.9 [766/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_0.cpp.o 1895.7 [767/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_8.cpp.o 1896.4 [768/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_3.cpp.o 1896.7 [769/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_1.cpp.o 1896.7 [770/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f16_instances.cpp.o 1897.1 [771/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_12.cpp.o 1898.1 [772/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_9.cpp.o 1899.8 [773/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_5.cpp.o 1900.1 [774/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_7.cpp.o 1900.5 [775/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_inter_instance.cpp.o 1900.8 [776/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_10.cpp.o 1900.9 [777/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_15.cpp.o 1902.6 [778/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f32_instances.cpp.o 1903.3 [779/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_11.cpp.o 1903.5 [780/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_2.cpp.o 1903.6 [781/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_8.cpp.o 1904.2 [782/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f32_tf32_instances.cpp.o 1905.2 [783/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_6.cpp.o 1905.5 [784/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_inter_instances_shard_4.cpp.o 1905.6 [785/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_0.cpp.o 1906.3 [786/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_14.cpp.o 1906.7 [787/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_1.cpp.o 1906.7 [788/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_12.cpp.o 1907.5 [789/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_13.cpp.o 1907.9 [790/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_3.cpp.o 1911.0 [791/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_mem_inter_instance.cpp.o 1911.4 [792/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_9.cpp.o 1912.6 [793/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_7.cpp.o 1913.4 [794/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_8.cpp.o 1914.0 [795/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_10.cpp.o 1914.0 [796/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_mem_intra_instance.cpp.o 1914.2 [797/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_13.cpp.o 1915.2 [798/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_5.cpp.o 1915.3 [799/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_6.cpp.o 1916.1 [800/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_11.cpp.o 1919.1 [801/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_12.cpp.o 1919.3 [802/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_14.cpp.o 1921.9 [803/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_7.cpp.o 1922.2 [804/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_9.cpp.o 1922.6 [805/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_15.cpp.o 1923.8 [806/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f32_instances_shard_0.cpp.o 1923.9 [807/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_6.cpp.o 1925.2 [808/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_mem_intra_instances_shard_4.cpp.o 1926.4 [809/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_5.cpp.o 1926.7 [810/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_13.cpp.o 1928.1 [811/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f32_instances_shard_2.cpp.o 1928.2 [812/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f32_instances_shard_1.cpp.o 1928.3 [813/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/mem/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_bf16_mem_intra_instance.cpp.o 1928.7 [814/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_1.cpp.o 1929.0 [815/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_4.cpp.o 1929.1 [816/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_2.cpp.o 1929.8 [817/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_inter_instances_shard_15.cpp.o 1930.1 [818/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f32_tf32_instances_shard_0.cpp.o 1930.9 [819/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_14.cpp.o 1937.0 [820/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_5.cpp.o 1938.9 [821/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_11.cpp.o 1939.7 [822/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances.cpp.o 1941.3 [823/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_15.cpp.o 1942.2 [824/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/mem/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_nhwgc_gkyxc_nhwgk_f32_tf32_mem_intra_instances_shard_4.cpp.o 1944.6 [825/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/large_tensor/device_grouped_conv3d_fwd_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_f32_instance.cpp.o 1944.8 [826/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_16x16_instance.cpp.o 1945.1 [827/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_16x16_instance.cpp.o 1945.2 [828/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f32_16x16_instance.cpp.o 1945.9 [829/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/large_tensor/device_grouped_conv3d_fwd_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instance.cpp.o 1949.2 [830/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_16x16_instance.cpp.o 1950.3 [831/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/merged_groups/device_grouped_conv3d_fwd_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instance.cpp.o 1952.2 [832/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/merged_groups/device_grouped_conv3d_fwd_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f32_instance.cpp.o 1954.1 [833/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f16_instances_shard_1.cpp.o 1954.6 [834/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f16_instances_shard_2.cpp.o 1956.8 [835/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_bf16_instances_shard_2.cpp.o 1959.3 [836/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_dynamic_op/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_dynamic_op_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_dynamic_op_nhwgc_gkyxc_nhwgk_f32_instance.cpp.o 1959.4 [837/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/large_tensor/device_grouped_conv3d_fwd_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 1959.6 [838/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_bf16_instances_shard_1.cpp.o 1959.8 [839/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances.cpp.o 1960.7 [840/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/large_tensor/device_grouped_conv3d_fwd_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_f16_instance.cpp.o 1964.7 [841/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_10.cpp.o 1966.8 [842/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_9.cpp.o 1968.6 [843/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_8.cpp.o 1968.8 [844/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/merged_groups/device_grouped_conv3d_fwd_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 1968.9 [845/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_dynamic_op/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_dynamic_op_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_dynamic_op_nhwgc_gkyxc_nhwgk_f16_instance.cpp.o 1971.2 [846/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_7.cpp.o 1971.5 [847/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_5.cpp.o 1971.7 [848/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/merged_groups/device_grouped_conv3d_fwd_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f16_instance.cpp.o 1971.8 [849/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_dynamic_op/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_dynamic_op_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_dynamic_op_nhwgc_gkyxc_nhwgk_bf16_instance.cpp.o 1975.0 [850/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_dynamic_op/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_dynamic_op_nhwgc_instance.dir/xdl/device_grouped_conv2d_fwd_xdl_dynamic_op_nhwgc_gkyxc_nhwgk_int8_instance.cpp.o 1975.7 [851/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances_shard_1.cpp.o 1976.8 [852/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_6.cpp.o 1977.3 [853/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_f16_instances_shard_0.cpp.o 1981.6 [854/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_bnorm_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_bnorm_clamp_nhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv2d_fwd_bias_bn_clamp_xdl_merged_groups_nhwgc_gkyxc_nhwgk_bf16_instances_shard_0.cpp.o 1986.3 [855/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances_shard_7.cpp.o 1987.1 [856/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances_shard_2.cpp.o 1990.6 [857/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances_shard_4.cpp.o 1991.9 [858/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_3.cpp.o 1992.0 [859/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances_shard_9.cpp.o 1992.2 [860/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances_shard_10.cpp.o 1994.8 [861/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances_shard_11.cpp.o 1995.6 [862/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_comp_instance.cpp.o 1996.8 [863/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f32_comp_instance.cpp.o 1999.4 [864/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances_shard_8.cpp.o 2004.5 [865/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances_shard_5.cpp.o 2006.0 [866/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances_shard_3.cpp.o 2015.0 [867/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_2.cpp.o 2015.3 [868/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances_shard_6.cpp.o 2025.8 [869/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_1.cpp.o 2026.0 [870/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances_shard_0.cpp.o 2028.0 [871/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_4.cpp.o 2033.2 [872/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_0.cpp.o 2037.9 [873/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_fwd_bias_clamp/nhwgc/CMakeFiles/device_grouped_conv2d_fwd_bias_clamp_nhwgc_instance.dir/xdl/comp/device_grouped_conv2d_fwd_bias_clamp_xdl_nhwgc_gkyxc_nhwgk_fp16_comp_part2_instance.cpp.o 2056.3 [874/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instance.cpp.o 2056.9 [875/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instance.cpp.o 2059.9 [876/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2063.6 [877/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instance.cpp.o 2063.7 [878/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_int8_instance.cpp.o 2067.5 [879/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_16_16_instance.cpp.o 2081.6 [880/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f16_wavelet_pad0_instance.cpp.o 2081.6 [881/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_ndhwgc_gkzyxc_ndhwgk_f16_16_16_instance.cpp.o 2082.0 [882/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f32_comp_large_tensors_instance.cpp.o 2082.5 [883/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_fp8_instance.cpp.o 2083.5 [884/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f16_wavelet_default_instance.cpp.o 2084.0 [885/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf8_instance.cpp.o 2084.0 [886/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_ndhwgc_gkzyxc_ndhwgk_f32_16_16_instance.cpp.o 2088.0 [887/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_fp8_bf8_instance.cpp.o 2091.5 [888/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_16_16_instance.cpp.o 2094.4 [889/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf8_fp8_instance.cpp.o 2095.0 [890/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_wavelet_default_instance.cpp.o 2095.2 [891/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f32_pad0_pipev2_instance.cpp.o 2099.0 [892/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_wavelet_pad0_instance.cpp.o 2101.5 [893/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f32_pad0_pipev5_instance.cpp.o 2101.7 [894/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_fp8_instance.cpp.o 2105.1 [895/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_ndhwgc_gkzyxc_ndhwgk_f32_optimized_loads_instance.cpp.o 2105.6 [896/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f32_default_pipev2_instance.cpp.o 2111.7 [897/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_pad0_pipev2_instance.cpp.o 2115.3 [898/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_optimized_loads_instance.cpp.o 2118.3 [899/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_pad0_pipev5_instance.cpp.o 2122.9 [900/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f32_default_pipev5_instance.cpp.o 2129.4 [901/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_default_pipev2_instance.cpp.o 2130.5 [902/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_large_tensors_instance.cpp.o 2136.1 [903/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_ndhwgc_gkzyxc_ndhwgk_f16_optimized_loads_instance.cpp.o 2136.2 [904/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_optimized_loads_instance.cpp.o 2141.7 [905/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_nhwgc_gkyxc_nhwgk_f16_instance.cpp.o 2145.7 [906/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/comp/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_large_tensors_instance.cpp.o 2149.0 [907/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_two_stage_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_pipev1_part2_instance.cpp.o 2149.2 [908/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_default_pipev5_instance.cpp.o 2152.2 [909/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_f32_bf16_instance.cpp.o 2152.9 [910/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2153.1 [911/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instance.cpp.o 2156.2 [912/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_two_stage_xdl_ndhwgc_gkzyxc_ndhwgk_f16_pipev1_part2_instance.cpp.o 2158.1 [913/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_nhwgc_gkyxc_nhwgk_bf16_instance.cpp.o 2166.5 [914/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_16x16_instance.cpp.o 2173.7 [915/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp16_16x16_instance.cpp.o 2174.1 [916/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_two_stage_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_pipev1_instance.cpp.o 2177.1 [917/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_16x16_instance.cpp.o 2185.8 [918/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_tf32_16x16_instance.cpp.o 2186.9 [919/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_two_stage_xdl_ndhwgc_gkzyxc_ndhwgk_f16_pipev1_instance.cpp.o 2191.5 [920/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/large_tensor/device_grouped_conv3d_fwd_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_fp32_instance.cpp.o 2193.4 [921/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/large_tensor/device_grouped_conv3d_fwd_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_fp32_tf32_instance.cpp.o 2195.1 [922/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_pad0_pipev2_instance.cpp.o 2198.0 [923/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instance.cpp.o 2201.3 [924/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instance.cpp.o 2202.7 [925/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instance.cpp.o 2202.8 [926/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/large_tensor/device_grouped_conv3d_fwd_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2203.5 [927/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/large_tensor/device_grouped_conv3d_fwd_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_fp16_instance.cpp.o 2207.3 [928/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instance.cpp.o 2211.3 [929/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f16_pad0_pipev2_instance.cpp.o 2216.1 [930/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/comp/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_comp_instance.cpp.o 2218.0 [931/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/comp/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_tf32_comp_instance.cpp.o 2231.2 [932/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/merged_groups/device_grouped_conv3d_fwd_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_fp32_instance.cpp.o 2233.1 [933/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/merged_groups/device_grouped_conv3d_fwd_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_fp32_tf32_instance.cpp.o 2235.6 [934/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_scale_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instance.cpp.o 2238.0 [935/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_scale_ndhwgc_gkzyxc_ndhwgk_f32_instance.cpp.o 2238.4 [936/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_v3_ndhwgc_gkzyxc_ndhwgk_f32_large_tensors_instance.cpp.o 2240.1 [937/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/merged_groups/device_grouped_conv3d_fwd_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2241.0 [938/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instance.cpp.o 2244.3 [939/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f16_pad0_pipev5_instance.cpp.o 2245.3 [940/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/merged_groups/device_grouped_conv3d_fwd_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_fp16_instance.cpp.o 2249.7 [941/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instance.cpp.o 2250.1 [942/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instance.cpp.o 2250.8 [943/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_scale_ndhwgc_gkzyxc_ndhwgk_f16_instance.cpp.o 2252.1 [944/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_16x16_instance.cpp.o 2252.3 [945/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_pad0_pipev5_instance.cpp.o 2259.0 [946/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp16_16x16_instance.cpp.o 2259.2 [947/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instance.cpp.o 2259.4 [948/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_scale_ndhwgc_gkzyxc_ndhwgk_int8_instance.cpp.o 2267.6 [949/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_bf8_fp8_instance.cpp.o 2268.9 [950/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f16_default_pipev2_instance.cpp.o 2270.5 [951/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_scale_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2272.5 [952/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_16x16_instance.cpp.o 2272.9 [953/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_default_pipev2_instance.cpp.o 2274.4 [954/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_tf32_16x16_instance.cpp.o 2279.0 [955/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/large_tensor/device_grouped_conv3d_fwd_bias_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_fp32_instance.cpp.o 2280.1 [956/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_instance.cpp.o 2283.1 [957/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_2x_instances.cpp.o 2285.1 [958/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/large_tensor/device_grouped_conv3d_fwd_bias_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_fp32_tf32_instance.cpp.o 2291.2 [959/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/large_tensor/device_grouped_conv3d_fwd_bias_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2295.0 [960/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/large_tensor/device_grouped_conv3d_fwd_bias_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_fp16_instance.cpp.o 2296.4 [961/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp16_instance.cpp.o 2296.7 [962/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_tf32_instance.cpp.o 2299.2 [963/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f32_default_large_tensors_instance.cpp.o 2299.7 [964/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instance.cpp.o 2300.5 [965/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2303.6 [966/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/merged_groups/device_grouped_conv3d_fwd_bias_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_fp32_instance.cpp.o 2305.8 [967/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/merged_groups/device_grouped_conv3d_fwd_bias_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_fp32_tf32_instance.cpp.o 2308.0 [968/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/comp/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_tf32_comp_instance.cpp.o 2309.0 [969/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances.cpp.o 2310.3 [970/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/comp/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_comp_instance.cpp.o 2312.6 [971/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/merged_groups/device_grouped_conv3d_fwd_bias_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2312.6 [972/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instance.cpp.o 2319.0 [973/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/merged_groups/device_grouped_conv3d_fwd_bias_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_fp16_instance.cpp.o 2321.5 [974/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_part2_instances.cpp.o 2327.3 [975/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_2x_instances_shard_0.cpp.o 2327.8 [976/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_2x_instances.cpp.o 2329.1 [977/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instance.cpp.o 2330.2 [978/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_2.cpp.o 2334.0 [979/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_10.cpp.o 2336.3 [980/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances.cpp.o 2337.5 [981/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_9.cpp.o 2337.5 [982/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_8.cpp.o 2341.0 [983/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2341.7 [984/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_1.cpp.o 2341.7 [985/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_two_stage_xdl_ndhwgc_gkzyxc_ndhwgk_f16_pipev2_irregular_instance.cpp.o 2347.0 [986/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_two_stage_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_pipev2_irregular_instance.cpp.o 2351.5 [987/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_7.cpp.o 2355.3 [988/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_default_pipev5_instance.cpp.o 2357.2 [989/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_part2_instances_shard_3.cpp.o 2360.6 [990/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_2x_instances_shard_0.cpp.o 2363.1 [991/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_part2_instances.cpp.o 2368.2 [992/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f16_default_pipev5_instance.cpp.o 2371.5 [993/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instance.cpp.o 2372.6 [994/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_v3_ndhwgc_gkzyxc_ndhwgk_f16_large_tensors_instance.cpp.o 2375.8 [995/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp16_instance.cpp.o 2376.9 [996/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instance.cpp.o 2377.3 [997/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_part2_instances_shard_1.cpp.o 2378.4 [998/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_instances_shard_0.cpp.o 2379.5 [999/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_part2_instances_shard_4.cpp.o 2380.8 [1000/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_comp_instances.cpp.o 2386.7 [1001/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2386.9 [1002/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_comp_instances.cpp.o 2388.2 [1003/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_part2_instances_shard_7.cpp.o 2390.2 [1004/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_instance.cpp.o 2390.4 [1005/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_v3_ndhwgc_gkzyxc_ndhwgk_bf16_large_tensors_instance.cpp.o 2392.0 [1006/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_tf32_instance.cpp.o 2393.2 [1007/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_5.cpp.o 2397.0 [1008/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_16x16_instances.cpp.o 2399.0 [1009/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_6.cpp.o 2399.8 [1010/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_f16_default_large_tensors_instance.cpp.o 2401.8 [1011/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_part2_instances_shard_8.cpp.o 2402.3 [1012/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_part2_instances_shard_11.cpp.o 2406.4 [1013/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_comp_instances_shard_0.cpp.o 2407.6 [1014/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_comp_instances_shard_1.cpp.o 2408.1 [1015/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_two_stage_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_pipev2_instance.cpp.o 2408.9 [1016/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_two_stage_xdl_ndhwgc_gkzyxc_ndhwgk_f16_pipev2_instance.cpp.o 2410.5 [1017/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_16x16_instances_shard_1.cpp.o 2410.5 [1018/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv2d_bwd_data/nhwgc/CMakeFiles/device_grouped_conv2d_bwd_data_nhwgc_instance.dir/xdl/device_grouped_conv2d_bwd_data_xdl_nhwgc_gkyxc_nhwgk_f32_instance.cpp.o 2410.7 [1019/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_16x16_instances_shard_0.cpp.o 2410.8 [1020/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_two_stage_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_pipev5_instance.cpp.o 2413.8 [1021/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_16x16_instances_shard_2.cpp.o 2413.9 [1022/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_16x16_instances_shard_3.cpp.o 2416.1 [1023/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_ndhwgc_gkzyxc_ndhwgk_input_f16_comp_bf8_f8_instance.cpp.o 2419.1 [1024/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances.cpp.o 2420.7 [1025/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_comp_instances_shard_3.cpp.o 2421.9 [1026/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_comp_instances_shard_1.cpp.o 2423.3 [1027/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_two_stage_xdl_ndhwgc_gkzyxc_ndhwgk_f16_pipev5_instance.cpp.o 2424.1 [1028/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_part2_instances_shard_9.cpp.o 2425.2 [1029/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_comp_instances_shard_0.cpp.o 2425.3 [1030/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_1.cpp.o 2428.9 [1031/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_2.cpp.o 2429.4 [1032/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_16x16_instances.cpp.o 2430.4 [1033/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_6.cpp.o 2431.0 [1034/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_comp_instances_shard_3.cpp.o 2431.3 [1035/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_3.cpp.o 2432.1 [1036/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_part2_instances_shard_10.cpp.o 2434.1 [1037/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_comp_instances_shard_2.cpp.o 2434.7 [1038/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_8.cpp.o 2434.7 [1039/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_4.cpp.o 2435.0 [1040/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_default_large_tensors_instance.cpp.o 2436.0 [1041/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_mem_inter_instance.cpp.o 2436.6 [1042/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_two_stage_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_large_tensors_instance.cpp.o 2436.8 [1043/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_10.cpp.o 2437.2 [1044/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_5.cpp.o 2437.7 [1045/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_7.cpp.o 2438.1 [1046/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_11.cpp.o 2438.7 [1047/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_15.cpp.o 2438.7 [1048/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_9.cpp.o 2438.7 [1049/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_13.cpp.o 2439.0 [1050/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_0.cpp.o 2439.8 [1051/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_12.cpp.o 2441.8 [1052/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_16x16_instances_shard_1.cpp.o 2443.8 [1053/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_14.cpp.o 2443.8 [1054/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_16x16_instances_shard_2.cpp.o 2444.1 [1055/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_16x16_instances_shard_3.cpp.o 2444.4 [1056/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_two_stage_xdl_ndhwgc_gkzyxc_ndhwgk_f16_large_tensors_instance.cpp.o 2445.3 [1057/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_16x16_instances_shard_0.cpp.o 2446.3 [1058/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances.cpp.o 2446.4 [1059/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_3.cpp.o 2447.2 [1060/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_16x16_instances.cpp.o 2447.2 [1061/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_comp_instances_shard_2.cpp.o 2450.6 [1062/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_tf32_mem_intra_instance.cpp.o 2452.2 [1063/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_two_stage_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_pipev5_irregular_instance.cpp.o 2454.9 [1064/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_mem_intra_instance.cpp.o 2455.8 [1065/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_1.cpp.o 2457.7 [1066/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_part2_instances_shard_1.cpp.o 2459.3 [1067/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_6.cpp.o 2460.5 [1068/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_2.cpp.o 2460.8 [1069/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_ndhwgc_instance.dir/xdl/ndhwgc_gkzyxc_ndhwgk/device_grouped_conv3d_bwd_weight_two_stage_xdl_ndhwgc_gkzyxc_ndhwgk_f16_pipev5_irregular_instance.cpp.o 2461.0 [1070/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances.cpp.o 2461.6 [1071/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_tf32_mem_inter_instance.cpp.o 2462.3 [1072/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_3.cpp.o 2462.4 [1073/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_4.cpp.o 2463.0 [1074/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_10.cpp.o 2463.1 [1075/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_13.cpp.o 2463.5 [1076/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_11.cpp.o 2463.7 [1077/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_8.cpp.o 2464.6 [1078/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_7.cpp.o 2464.8 [1079/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_9.cpp.o 2465.1 [1080/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_part2_instances_shard_2.cpp.o 2465.5 [1081/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_14.cpp.o 2465.6 [1082/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_part2_instances_shard_0.cpp.o 2465.6 [1083/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_5.cpp.o 2465.9 [1084/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_16x16_instances_shard_2.cpp.o 2466.1 [1085/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_15.cpp.o 2466.2 [1086/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_12.cpp.o 2468.4 [1087/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_16x16_instances_shard_1.cpp.o 2468.6 [1088/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_16x16_instances_shard_0.cpp.o 2469.2 [1089/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_16x16_instances.cpp.o 2469.3 [1090/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_0.cpp.o 2470.0 [1091/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_part2_instances_shard_2.cpp.o 2470.6 [1092/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_2.cpp.o 2471.2 [1093/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_1.cpp.o 2471.5 [1094/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_10.cpp.o 2473.0 [1095/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_11.cpp.o 2473.9 [1096/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_6.cpp.o 2473.9 [1097/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_13.cpp.o 2475.1 [1098/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances.cpp.o 2475.5 [1099/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_part2_instances_shard_5.cpp.o 2475.5 [1100/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_7.cpp.o 2475.7 [1101/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_8.cpp.o 2476.6 [1102/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_9.cpp.o 2477.1 [1103/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_3.cpp.o 2477.4 [1104/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_4.cpp.o 2477.4 [1105/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_bf16_instances.cpp.o 2477.4 [1106/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_14.cpp.o 2478.2 [1107/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_12.cpp.o 2478.7 [1108/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_5.cpp.o 2479.4 [1109/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_f16_instances.cpp.o 2479.5 [1110/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_15.cpp.o 2481.3 [1111/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_part2_instances_shard_4.cpp.o 2482.1 [1112/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_f32_instances.cpp.o 2483.8 [1113/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances.cpp.o 2483.9 [1114/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instance.cpp.o 2484.3 [1115/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_part2_instances_shard_6.cpp.o 2485.6 [1116/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_16x16_instances_shard_1.cpp.o 2486.3 [1117/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_16x16_instances_shard_2.cpp.o 2486.4 [1118/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_16x16_instances_shard_0.cpp.o 2488.8 [1119/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp16_mem_inter_instance.cpp.o 2491.5 [1120/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_11.cpp.o 2492.5 [1121/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_1.cpp.o 2493.3 [1122/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_2.cpp.o 2493.5 [1123/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_13.cpp.o 2493.8 [1124/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_6.cpp.o 2493.8 [1125/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_10.cpp.o 2494.8 [1126/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_15.cpp.o 2495.1 [1127/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_8.cpp.o 2495.1 [1128/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_12.cpp.o 2496.0 [1129/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_14.cpp.o 2497.1 [1130/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances.cpp.o 2497.4 [1131/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_7.cpp.o 2497.8 [1132/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_0.cpp.o 2498.3 [1133/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_9.cpp.o 2499.7 [1134/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_1.cpp.o 2499.8 [1135/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_4.cpp.o 2499.8 [1136/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_3.cpp.o 2500.0 [1137/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_2.cpp.o 2500.1 [1138/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_0.cpp.o 2500.3 [1139/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_2.cpp.o 2501.2 [1140/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_5.cpp.o 2503.4 [1141/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_1.cpp.o 2503.8 [1142/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_1.cpp.o 2504.4 [1143/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_1.cpp.o 2505.1 [1144/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_0.cpp.o 2505.7 [1145/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_2.cpp.o 2505.9 [1146/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_0.cpp.o 2506.0 [1147/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_0.cpp.o 2506.9 [1148/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/large_tensor/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_large_tensor_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_0.cpp.o 2507.4 [1149/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_1.cpp.o 2508.7 [1150/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_3.cpp.o 2510.6 [1151/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances.cpp.o 2515.6 [1152/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_12.cpp.o 2517.7 [1153/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_11.cpp.o 2518.6 [1154/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_0.cpp.o 2519.0 [1155/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_14.cpp.o 2520.3 [1156/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_13.cpp.o 2520.8 [1157/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_10.cpp.o 2522.4 [1158/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_9.cpp.o 2524.1 [1159/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_0.cpp.o 2524.2 [1160/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_2.cpp.o 2525.3 [1161/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_8.cpp.o 2526.2 [1162/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_1.cpp.o 2526.9 [1163/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_3.cpp.o 2526.9 [1164/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instance.cpp.o 2527.5 [1165/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_16.cpp.o 2527.8 [1166/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_15.cpp.o 2529.2 [1167/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_mem_inter_instance.cpp.o 2531.2 [1168/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_5.cpp.o 2531.7 [1169/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/comp/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp16_comp_instance.cpp.o 2531.7 [1170/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_7.cpp.o 2532.7 [1171/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_12.cpp.o 2533.4 [1172/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_mem_intra_instance.cpp.o 2533.8 [1173/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_18.cpp.o 2534.0 [1174/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_19.cpp.o 2534.3 [1175/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances.cpp.o 2535.4 [1176/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_2.cpp.o 2535.7 [1177/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_13.cpp.o 2536.4 [1178/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_tf32_mem_inter_instance.cpp.o 2536.4 [1179/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_0.cpp.o 2536.6 [1180/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_3.cpp.o 2536.7 [1181/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_14.cpp.o 2537.5 [1182/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_17.cpp.o 2537.9 [1183/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_11.cpp.o 2538.0 [1184/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_10.cpp.o 2538.1 [1185/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_1.cpp.o 2538.3 [1186/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_6.cpp.o 2539.2 [1187/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instances_shard_4.cpp.o 2539.8 [1188/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_9.cpp.o 2540.1 [1189/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_8.cpp.o 2542.4 [1190/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_15.cpp.o 2543.2 [1191/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp16_mem_intra_instance.cpp.o 2543.8 [1192/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp32_tf32_mem_intra_instance.cpp.o 2544.8 [1193/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_7.cpp.o 2545.2 [1194/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_16.cpp.o 2546.6 [1195/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances.cpp.o 2547.9 [1196/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_5.cpp.o 2549.9 [1197/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_10.cpp.o 2550.0 [1198/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_18.cpp.o 2550.1 [1199/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_8.cpp.o 2550.8 [1200/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_17.cpp.o 2551.6 [1201/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_12.cpp.o 2551.7 [1202/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_19.cpp.o 2552.1 [1203/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_6.cpp.o 2552.2 [1204/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_9.cpp.o 2553.4 [1205/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instances_shard_4.cpp.o 2555.8 [1206/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_part2_instances_shard_0.cpp.o 2555.9 [1207/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_11.cpp.o 2556.0 [1208/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_14.cpp.o 2556.3 [1209/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_13.cpp.o 2556.5 [1210/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_2.cpp.o 2557.6 [1211/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_5.cpp.o 2557.9 [1212/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_0.cpp.o 2559.2 [1213/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_0.cpp.o 2559.3 [1214/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_1.cpp.o 2559.6 [1215/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_3.cpp.o 2559.7 [1216/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances.cpp.o 2561.2 [1217/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_7.cpp.o 2563.2 [1218/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_15.cpp.o 2563.7 [1219/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_4.cpp.o 2565.9 [1220/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_6.cpp.o 2566.5 [1221/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_comp_part2_instances_shard_3.cpp.o 2567.6 [1222/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_16.cpp.o 2568.6 [1223/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_12.cpp.o 2568.7 [1224/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_3.cpp.o 2568.9 [1225/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances.cpp.o 2569.4 [1226/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_2.cpp.o 2570.5 [1227/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_0.cpp.o 2571.8 [1228/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_14.cpp.o 2571.9 [1229/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_1.cpp.o 2573.1 [1230/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_11.cpp.o 2573.7 [1231/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_13.cpp.o 2573.7 [1232/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_18.cpp.o 2573.7 [1233/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_10.cpp.o 2574.8 [1234/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_clamp_ndhwgc_instance.dir/xdl/comp/device_grouped_conv3d_fwd_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instance.cpp.o 2575.5 [1235/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_9.cpp.o 2575.5 [1236/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_19.cpp.o 2575.7 [1237/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_8.cpp.o 2575.8 [1238/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_inter_instances_shard_17.cpp.o 2578.7 [1239/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_15.cpp.o 2579.5 [1240/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_5.cpp.o 2579.6 [1241/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_16.cpp.o 2580.2 [1242/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_11.cpp.o 2580.6 [1243/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/comp/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instances_shard_4.cpp.o 2580.9 [1244/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_10.cpp.o 2581.6 [1245/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_8.cpp.o 2582.3 [1246/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances.cpp.o 2582.6 [1247/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_3.cpp.o 2583.0 [1248/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_2.cpp.o 2585.1 [1249/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_7.cpp.o 2585.5 [1250/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_17.cpp.o 2585.9 [1251/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_0.cpp.o 2586.3 [1252/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_19.cpp.o 2586.6 [1253/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_1.cpp.o 2586.7 [1254/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_18.cpp.o 2587.5 [1255/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_9.cpp.o 2588.2 [1256/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_12.cpp.o 2588.5 [1257/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_6.cpp.o 2588.7 [1258/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_4.cpp.o 2590.4 [1259/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_7.cpp.o 2591.4 [1260/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_10.cpp.o 2591.9 [1261/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_11.cpp.o 2592.8 [1262/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_8.cpp.o 2592.9 [1263/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_13.cpp.o 2593.5 [1264/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f16_mem_intra_instances_shard_6.cpp.o 2593.6 [1265/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_0.cpp.o 2594.7 [1266/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances.cpp.o 2595.5 [1267/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_bf16_instances.cpp.o 2596.2 [1268/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_2.cpp.o 2597.5 [1269/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_1.cpp.o 2597.7 [1270/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_12.cpp.o 2598.7 [1271/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f16_instances.cpp.o 2599.3 [1272/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_14.cpp.o 2599.7 [1273/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_3.cpp.o 2604.8 [1274/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f32_instances.cpp.o 2606.7 [1275/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_9.cpp.o 2607.0 [1276/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_15.cpp.o 2607.1 [1277/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_7.cpp.o 2607.7 [1278/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_5.cpp.o 2608.1 [1279/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances.cpp.o 2609.6 [1280/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_6.cpp.o 2612.2 [1281/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_13.cpp.o 2613.4 [1282/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_2.cpp.o 2613.5 [1283/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_8.cpp.o 2613.6 [1284/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_11.cpp.o 2614.8 [1285/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_10.cpp.o 2616.0 [1286/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_inter_instances_shard_4.cpp.o 2616.3 [1287/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_3.cpp.o 2616.3 [1288/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_0.cpp.o 2617.3 [1289/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_14.cpp.o 2618.8 [1290/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_1.cpp.o 2625.2 [1291/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_9.cpp.o 2626.5 [1292/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_12.cpp.o 2627.3 [1293/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp16_mem_inter_instance.cpp.o 2627.8 [1294/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_7.cpp.o 2633.5 [1295/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_8.cpp.o 2634.3 [1296/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_11.cpp.o 2634.7 [1297/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_inter_instance.cpp.o 2634.8 [1298/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_10.cpp.o 2636.5 [1299/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_6.cpp.o 2637.2 [1300/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_5.cpp.o 2638.3 [1301/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_15.cpp.o 2641.5 [1302/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_13.cpp.o 2643.3 [1303/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_12.cpp.o 2644.6 [1304/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_14.cpp.o 2647.3 [1305/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_mem_intra_instances_shard_4.cpp.o 2648.0 [1306/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_7.cpp.o 2649.1 [1307/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_9.cpp.o 2653.1 [1308/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_13.cpp.o 2653.5 [1309/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_6.cpp.o 2655.0 [1310/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_2.cpp.o 2656.1 [1311/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_0.cpp.o 2658.4 [1312/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_5.cpp.o 2659.4 [1313/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_2.cpp.o 2659.7 [1314/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f32_instances_shard_1.cpp.o 2660.4 [1315/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_15.cpp.o 2661.6 [1316/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_14.cpp.o 2661.7 [1317/1431] cd /__w/rockrel/rockrel/build/ml-libs/composable_kernel/build && /usr/local/therock-tools/bin/cmake -E rm -f /__w/rockrel/rockrel/build/ml-libs/composable_kernel/stamp/stage.stamp 2663.6 [1318/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_0.cpp.o 2663.8 [1319/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_mem_intra_instance.cpp.o 2666.8 [1320/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instances_shard_1.cpp.o 2667.6 [1321/1431] Building CXX object library/src/utility/CMakeFiles/utility.dir/device_memory.cpp.o 2668.7 [1322/1431] Linking CXX static library lib/libdevice_contraction_operations.a 2668.8 [1323/1431] Linking CXX static library lib/libdevice_other_operations.a 2671.0 [1324/1431] Building CXX object library/src/utility/CMakeFiles/utility.dir/convolution_parameter.cpp.o 2671.3 [1325/1431] Building CXX object library/src/utility/CMakeFiles/utility.dir/host_tensor.cpp.o 2672.3 [1326/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_inter_instances_shard_4.cpp.o 2677.9 [1327/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_5.cpp.o 2679.8 [1328/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/mem/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp16_mem_intra_instance.cpp.o 2686.6 [1329/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_15.cpp.o 2688.4 [1330/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/mem/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_f32_tf32_mem_intra_instances_shard_4.cpp.o 2705.2 [1331/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_1.cpp.o 2713.6 [1332/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_2.cpp.o 2725.7 [1333/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_2.cpp.o 2727.3 [1334/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_reduce/CMakeFiles/device_gemm_reduce_instance.dir/device_gemm_reduce_xdl_cshuffle_f16_f16_f16_f32_f32_mk_kn_mn_instance.cpp.o 2727.3 [1335/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_1.cpp.o 2732.8 [1336/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_dynamic_op/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_dynamic_op_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_dynamic_op_ndhwgc_gkzyxc_ndhwgk_f32_instance.cpp.o 2732.8 [1337/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_weight_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2739.6 [1338/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_weight_xdl_scale_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2756.0 [1339/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_dynamic_op/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_dynamic_op_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_dynamic_op_ndhwgc_gkzyxc_ndhwgk_f16_instance.cpp.o 2757.8 [1340/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_dynamic_op/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_dynamic_op_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_dynamic_op_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2761.7 [1341/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_bf16_instances_shard_0.cpp.o 2762.2 [1342/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_scaleadd_ab/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_scaleadd_ab_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_scaleadd_ab_ndhwgc_gkzyxc_ndhwgk_f32_instance.cpp.o 2769.0 [1343/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_scaleadd_scaleadd_relu/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_scaleadd_scaleadd_relu_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_scaleadd_scaleadd_relu_ndhwgc_gkzyxc_ndhwgk_f32_instance.cpp.o 2769.2 [1344/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_bnorm_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_bnorm_clamp_ndhwgc_instance.dir/generated/xdl/merged_groups/device_grouped_conv3d_fwd_bias_bn_clamp_xdl_merged_groups_ndhwgc_gkzyxc_ndhwgk_f16_instances_shard_0.cpp.o 2779.8 [1345/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_dynamic_op/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_dynamic_op_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_dynamic_op_ndhwgc_gkzyxc_ndhwgk_int8_instance.cpp.o 2782.8 [1346/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_scaleadd_ab/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_scaleadd_ab_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_scaleadd_ab_ndhwgc_gkzyxc_ndhwgk_f16_instance.cpp.o 2798.8 [1347/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_scaleadd_scaleadd_relu/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_scaleadd_scaleadd_relu_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_scaleadd_scaleadd_relu_ndhwgc_gkzyxc_ndhwgk_int8_instance.cpp.o 2800.4 [1348/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_scaleadd_scaleadd_relu/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_scaleadd_scaleadd_relu_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_scaleadd_scaleadd_relu_ndhwgc_gkzyxc_ndhwgk_f16_instance.cpp.o 2801.0 [1349/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_bias_add_reduce/CMakeFiles/device_gemm_bias_add_reduce_instance.dir/device_gemm_bias_add_mean_squaremean_xdl_cshuffle_f16_f16_f16_f32_f32_mk_nk_mn_instance.cpp.o 2802.6 [1350/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_scaleadd_scaleadd_relu/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_scaleadd_scaleadd_relu_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_scaleadd_scaleadd_relu_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2807.3 [1351/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_scaleadd_ab/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_scaleadd_ab_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_scaleadd_ab_ndhwgc_gkzyxc_ndhwgk_int8_instance.cpp.o 2808.1 [1352/1431] Building CXX object library/src/tensor_operation_instance/gpu/batched_gemm_reduce/CMakeFiles/device_batched_gemm_reduce_instance.dir/device_batched_gemm_reduce_xdl_cshuffle_f16_f16_f16_f32_f32_gmk_gnk_gmn_instance.cpp.o 2823.5 [1353/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_reduce/CMakeFiles/device_gemm_reduce_instance.dir/device_gemm_reduce_xdl_cshuffle_f16_f16_f16_f32_f32_mk_nk_mn_instance.cpp.o 2826.1 [1354/1431] Building CXX object library/src/tensor_operation_instance/gpu/batched_gemm_reduce/CMakeFiles/device_batched_gemm_reduce_instance.dir/device_batched_gemm_reduce_xdl_cshuffle_f16_f16_f16_f32_f32_gkm_gkn_gmn_instance.cpp.o 2826.8 [1355/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_scaleadd_ab/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_scaleadd_ab_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_scaleadd_ab_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2851.1 [1356/1431] Building CXX object library/src/tensor_operation_instance/gpu/batched_gemm_reduce/CMakeFiles/device_batched_gemm_reduce_instance.dir/device_batched_gemm_reduce_xdl_cshuffle_f16_f16_f16_f32_f32_gmk_gkn_gmn_instance.cpp.o 2859.5 [1357/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_f32_instance.cpp.o 2861.1 [1358/1431] Building CXX object library/src/tensor_operation_instance/gpu/batched_gemm_reduce/CMakeFiles/device_batched_gemm_reduce_instance.dir/device_batched_gemm_reduce_xdl_cshuffle_f16_f16_f16_f32_f32_gkm_gnk_gmn_instance.cpp.o 2864.6 [1359/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instance.cpp.o 2869.0 [1360/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_bias_add_reduce/CMakeFiles/device_gemm_bias_add_reduce_instance.dir/device_gemm_bias_add_mean_squaremean_xdl_cshuffle_f16_f16_f16_f32_f32_km_nk_mn_instance.cpp.o 2884.9 [1361/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_reduce/CMakeFiles/device_gemm_reduce_instance.dir/device_gemm_reduce_xdl_cshuffle_f16_f16_f16_f32_f32_km_nk_mn_instance.cpp.o 2887.8 [1362/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_bias_add_reduce/CMakeFiles/device_gemm_bias_add_reduce_instance.dir/device_gemm_bias_add_mean_squaremean_xdl_cshuffle_f16_f16_f16_f32_f32_mk_kn_mn_instance.cpp.o 2892.1 [1363/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_reduce/CMakeFiles/device_gemm_reduce_instance.dir/device_gemm_reduce_xdl_cshuffle_f16_f16_f16_f32_f32_km_kn_mn_instance.cpp.o 2893.4 [1364/1431] Linking CXX static library lib/libdevice_reduction_operations.a 2893.5 [1365/1431] Linking CXX static library lib/libutility.a 2896.8 [1366/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_convscale/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_convscale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_combconvscale_ndhwgc_gkzyxc_ndhwgk_f8_f8_f32_instance.cpp.o 2900.1 [1367/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_convscale_relu/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_convscale_relu_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_convscale_relu_ndhwgc_gkzyxc_ndhwgk_f8_instance.cpp.o 2902.0 [1368/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_bias_add_reduce/CMakeFiles/device_gemm_bias_add_reduce_instance.dir/device_gemm_bias_add_mean_squaremean_xdl_cshuffle_f16_f16_f16_f32_f32_km_kn_mn_instance.cpp.o 2904.7 [1369/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_convinvscale/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_convinvscale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_convinvscale_ndhwgc_gkzyxc_ndhwgk_f8_instance.cpp.o 2907.8 [1370/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_convscale_relu/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_convscale_relu_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_combconvscale_relu_ndhwgc_gkzyxc_ndhwgk_f8_f8_f32_instance.cpp.o 2910.5 [1371/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_convscale/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_convscale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_convscale_ndhwgc_gkzyxc_ndhwgk_bf8_f8_instance.cpp.o 2911.5 [1372/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_convscale/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_convscale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_convscale_ndhwgc_gkzyxc_ndhwgk_f8_instance.cpp.o 2912.0 [1373/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_int8_instance.cpp.o 2914.2 [1374/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_weight_xdl_scale_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instance.cpp.o 2916.9 [1375/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_f16_instance.cpp.o 2917.2 [1376/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_convscale/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_convscale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_convscale_ndhwgc_gkzyxc_ndhwgk_bf8_instance.cpp.o 2924.1 [1377/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/comp/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_fp16_comp_instance.cpp.o 2933.2 [1378/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_convscale/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_convscale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_convscale_ndhwgc_gkzyxc_ndhwgk_f8_bf8_instance.cpp.o 2941.9 [1379/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_convscale_add/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_convscale_add_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_convscale_add_ndhwgc_gkzyxc_ndhwgk_f8_instance.cpp.o 2942.2 [1380/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_weight_xdl_scale_ndhwgc_gkzyxc_ndhwgk_f16_instance.cpp.o 2946.0 [1381/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_weight_xdl_scale_ndhwgc_gkzyxc_ndhwgk_f32_instance.cpp.o 2948.7 [1382/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_fwd_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 2960.1 [1383/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_weight_xdl_scale_ndhwgc_gkzyxc_ndhwgk_f16_comp_bf8_fp8_instance.cpp.o 2965.1 [1384/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_weight_xdl_scale_ndhwgc_gkzyxc_ndhwgk_bf16_f32_bf16_instance.cpp.o 3033.0 [1385/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_weight_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_f32_instance.cpp.o 3035.2 [1386/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_bf16_i8_bf16/device_gemm_xdl_universal_bf16_i8_bf16_mk_kn_mn_mem_v2_kpadding_instance.cpp.o 3040.1 [1387/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_weight_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instance.cpp.o 3041.2 [1388/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_bf16_i8_bf16/device_gemm_xdl_universal_bf16_i8_bf16_mk_kn_mn_mem_v2_default_instance.cpp.o 3052.0 [1389/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_bf16_i8_bf16/device_gemm_xdl_universal_bf16_i8_bf16_mk_kn_mn_mem_v2_mnkpadding_instance.cpp.o 3061.5 [1390/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_bf16_i8_bf16/device_gemm_xdl_universal_bf16_i8_bf16_mk_kn_mn_comp_mnpadding_instance.cpp.o 3066.7 [1391/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_bf16_bf16_bf16/device_gemm_xdl_universal_bf16_bf16_bf16_mk_kn_mn_comp_mnpadding_instance.cpp.o 3070.3 [1392/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_bf16_bf16_bf16/device_gemm_xdl_universal_bf16_bf16_bf16_mk_kn_mn_comp_kpadding_instance.cpp.o 3071.0 [1393/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_bf16_bf16_bf16/device_gemm_xdl_universal_bf16_bf16_bf16_mk_kn_mn_comp_mnkpadding_instance.cpp.o 3071.0 [1394/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_bf16_i8_bf16/device_gemm_xdl_universal_bf16_i8_bf16_mk_kn_mn_comp_kpadding_instance.cpp.o 3072.6 [1395/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_bf16_i8_bf16/device_gemm_xdl_universal_bf16_i8_bf16_mk_kn_mn_comp_default_instance.cpp.o 3072.8 [1396/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_weight_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_bf16_f32_bf16_instance.cpp.o 3076.4 [1397/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_bf16_bf16_bf16/device_gemm_xdl_universal_bf16_bf16_bf16_mk_kn_mn_comp_default_instance.cpp.o 3080.6 [1398/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_scale_ndhwgc_gkzyxc_ndhwgk_f16_instance.cpp.o 3087.9 [1399/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_scale_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 3095.1 [1400/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_scale_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instance.cpp.o 3097.3 [1401/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_f16_f16_f16/device_gemm_xdl_universal_f16_f16_f16_mk_kn_mn_comp_mnkpadding_instance.cpp.o 3097.4 [1402/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_f16_f16_f16/device_gemm_xdl_universal_f16_f16_f16_mk_kn_mn_comp_default_instance.cpp.o 3098.5 [1403/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_weight_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_f16_comp_bf8_fp8_instance.cpp.o 3099.2 [1404/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_f16_f16_f16/device_gemm_xdl_universal_f16_f16_f16_mk_kn_mn_comp_kpadding_instance.cpp.o 3100.8 [1405/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_bf16_i8_bf16/device_gemm_xdl_universal_bf16_i8_bf16_mk_kn_mn_comp_mnkpadding_instance.cpp.o 3103.1 [1406/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_f16_f16_f16/device_gemm_xdl_universal_f16_f16_f16_mk_kn_mn_comp_mnpadding_instance.cpp.o 3110.5 [1407/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_weight_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_weight_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_weight_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_f16_instance.cpp.o 3117.7 [1408/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data_scale/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_scale_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_scale_ndhwgc_gkzyxc_ndhwgk_f32_instance.cpp.o 3118.1 [1409/1431] Building CXX object library/src/tensor_operation_instance/gpu/quantization/CMakeFiles/device_quantization_instance.dir/gemm/device_gemm_quantization_xdl_c_shuffle_i8_i8_i8_km_nk_mn_instance.cpp.o 3121.1 [1410/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_f16_instance.cpp.o 3129.1 [1411/1431] Building CXX object library/src/tensor_operation_instance/gpu/quantization/CMakeFiles/device_quantization_instance.dir/gemm/device_gemm_quantization_xdl_c_shuffle_i8_i8_i8_mk_nk_mn_instance.cpp.o 3132.1 [1412/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_f32_instance.cpp.o 3135.9 [1413/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_f32_tf32_instance.cpp.o 3139.3 [1414/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_bf16_bf16_bf16/device_gemm_xdl_universal_bf16_bf16_bf16_mk_kn_mn_mem_v2_default_instance.cpp.o 3139.7 [1415/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_fwd_bias_clamp/ndhwgc/CMakeFiles/device_grouped_conv3d_fwd_bias_clamp_ndhwgc_instance.dir/xdl/comp/device_grouped_conv3d_fwd_bias_clamp_xdl_ndhwgc_gkzyxc_ndhwgk_bf16_comp_instance.cpp.o 3143.0 [1416/1431] Building CXX object library/src/tensor_operation_instance/gpu/quantization/CMakeFiles/device_quantization_instance.dir/conv2d_fwd/device_conv2d_xdl_perlayer_quantization_int8_instance.cpp.o 3143.9 [1417/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_bf16_bf16_bf16/device_gemm_xdl_universal_bf16_bf16_bf16_mk_kn_mn_mem_v2_mnkpadding_instance.cpp.o 3149.9 [1418/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_bf16_bf16_bf16/device_gemm_xdl_universal_bf16_bf16_bf16_mk_kn_mn_mem_v2_kpadding_instance.cpp.o 3152.4 [1419/1431] Building CXX object library/src/tensor_operation_instance/gpu/quantization/CMakeFiles/device_quantization_instance.dir/gemm/device_gemm_quantization_xdl_c_shuffle_i8_i8_i8_mk_kn_mn_instance.cpp.o 3153.4 [1420/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_f16_f16_f16/device_gemm_xdl_universal_f16_f16_f16_mk_kn_mn_mem_v1_kpadding_instance.cpp.o 3153.6 [1421/1431] Building CXX object library/src/tensor_operation_instance/gpu/quantization/CMakeFiles/device_quantization_instance.dir/conv2d_fwd/device_conv2d_xdl_perchannel_quantization_int8_instance.cpp.o 3158.7 [1422/1431] Building CXX object library/src/tensor_operation_instance/gpu/quantization/CMakeFiles/device_quantization_instance.dir/gemm/device_gemm_quantization_xdl_c_shuffle_i8_i8_i8_km_kn_mn_instance.cpp.o 3163.2 [1423/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_f16_f16_f16/device_gemm_xdl_universal_f16_f16_f16_mk_kn_mn_mem_v2_default_instance.cpp.o 3165.0 [1424/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_f16_f16_f16/device_gemm_xdl_universal_f16_f16_f16_mk_kn_mn_mem_v1_default_instance.cpp.o 3166.4 [1425/1431] Building CXX object library/src/tensor_operation_instance/gpu/grouped_conv3d_bwd_data_bilinear/ndhwgc/CMakeFiles/device_grouped_conv3d_bwd_data_bilinear_ndhwgc_instance.dir/xdl/device_grouped_conv3d_bwd_data_xdl_bilinear_ndhwgc_gkzyxc_ndhwgk_bf16_instance.cpp.o 3169.0 [1426/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_f16_f16_f16/device_gemm_xdl_universal_f16_f16_f16_mk_kn_mn_mem_v2_kpadding_instance.cpp.o 3169.5 [1427/1431] Linking CXX static library lib/libdevice_conv_operations.a 3171.2 [1428/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_f16_f16_f16/device_gemm_xdl_universal_f16_f16_f16_mk_kn_mn_mem_v1_mnkpadding_instance.cpp.o 3173.1 [1429/1431] Building CXX object library/src/tensor_operation_instance/gpu/gemm_universal_reduce/CMakeFiles/device_gemm_universal_reduce_instance.dir/device_gemm_xdl_universal_f16_f16_f16/device_gemm_xdl_universal_f16_f16_f16_mk_kn_mn_mem_v2_mnkpadding_instance.cpp.o 3242.2 [1430/1431] Building CXX object library/src/tensor_operation_instance/gpu/quantization/CMakeFiles/device_quantization_instance.dir/conv2d_fwd/device_conv2d_xdl_bias_perlayer_quantization_int8_instance.cpp.o 3261.5 [1431/1431] Building CXX object library/src/tensor_operation_instance/gpu/quantization/CMakeFiles/device_quantization_instance.dir/conv2d_fwd/device_conv2d_xdl_bias_perchannel_quantization_int8_instance.cpp.o END 1782128929.2844563 3261.4763827323914 0